Slamseq iBet spikeIn Max P paper

In [43]:
from __future__ import print_function
import os.path
import pandas as pd
import sys
sys.path.insert(0, '../../')
import seaborn as sns
import numpy as np

from JKBio.Helper import *
from JKBio.helper import pyDESeq2

from bokeh.plotting import *
from bokeh.models import HoverTool
import matplotlib.pyplot as plt

from sklearn.neighbors import KNeighborsClassifier
from sklearn.manifold import MDS, TSNE
from sklearn.decomposition import PCA
from sklearn.preprocessing import scale
#from umap import UMAP

output_notebook()
%load_ext autoreload
%matplotlib inline
%autoreload 2
%load_ext rpy2.ipython
Loading BokehJS ...
The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
The rpy2.ipython extension is already loaded. To reload it, use:
  %reload_ext rpy2.ipython

downloading their data

downloading the data

In [545]:
version="vAll"
project="slamseqMax"
location= '../data/'+project+"/"
In [4]:
mkdir ../$location
In [30]:
!gsutil ls gs://transfer-amlproject/200827_MP8179_fastq/
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_10_MP8179_S169_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_10_MP8179_S169_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_10_MP8179_S169_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_10_MP8179_S169_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_11_MP8179_S170_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_11_MP8179_S170_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_11_MP8179_S170_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_11_MP8179_S170_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_12_MP8179_S171_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_12_MP8179_S171_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_12_MP8179_S171_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_12_MP8179_S171_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_13_MP8179_S172_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_13_MP8179_S172_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_13_MP8179_S172_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_13_MP8179_S172_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_14_MP8179_S173_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_14_MP8179_S173_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_14_MP8179_S173_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_14_MP8179_S173_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_15_MP8179_S174_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_15_MP8179_S174_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_15_MP8179_S174_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_15_MP8179_S174_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_16_MP8179_S175_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_16_MP8179_S175_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_16_MP8179_S175_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_16_MP8179_S175_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_17_MP8179_S176_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_17_MP8179_S176_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_17_MP8179_S176_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_17_MP8179_S176_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_18_MP8179_S177_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_18_MP8179_S177_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_18_MP8179_S177_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_18_MP8179_S177_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_19_MP8179_S178_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_19_MP8179_S178_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_19_MP8179_S178_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_19_MP8179_S178_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_1_MP8179_S160_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_1_MP8179_S160_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_1_MP8179_S160_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_1_MP8179_S160_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_20_MP8179_S179_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_20_MP8179_S179_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_20_MP8179_S179_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_20_MP8179_S179_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_21_MP8179_S180_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_21_MP8179_S180_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_21_MP8179_S180_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_21_MP8179_S180_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_23_MP8179_S181_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_23_MP8179_S181_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_23_MP8179_S181_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_23_MP8179_S181_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_24_MP8179_S182_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_24_MP8179_S182_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_24_MP8179_S182_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_24_MP8179_S182_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_2_MP8179_S161_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_2_MP8179_S161_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_2_MP8179_S161_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_2_MP8179_S161_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_3_MP8179_S162_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_3_MP8179_S162_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_3_MP8179_S162_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_3_MP8179_S162_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_4_MP8179_S163_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_4_MP8179_S163_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_4_MP8179_S163_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_4_MP8179_S163_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_5_MP8179_S164_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_5_MP8179_S164_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_5_MP8179_S164_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_5_MP8179_S164_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_6_MP8179_S165_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_6_MP8179_S165_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_6_MP8179_S165_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_6_MP8179_S165_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_7_MP8179_S166_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_7_MP8179_S166_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_7_MP8179_S166_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_7_MP8179_S166_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_8_MP8179_S167_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_8_MP8179_S167_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_8_MP8179_S167_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_8_MP8179_S167_R2_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_9_MP8179_S168_R1_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_9_MP8179_S168_R1_001_fastqc.zip
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_9_MP8179_S168_R2_001_fastqc.html
gs://transfer-amlproject/200827_MP8179_fastq/Reports/20200827_9_MP8179_S168_R2_001_fastqc.zip
In [24]:
! gsutil -m cp gs://transfer-amlproject/slamseq_inhibitor_spikeins/*MP8179*.fastq.gz ../../data/$project/fastqs/
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_10_MP8179_S169_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_10_MP8179_S169_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_11_MP8179_S170_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_11_MP8179_S170_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_12_MP8179_S171_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_12_MP8179_S171_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_13_MP8179_S172_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_13_MP8179_S172_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_14_MP8179_S173_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_14_MP8179_S173_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_15_MP8179_S174_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_15_MP8179_S174_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_16_MP8179_S175_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_16_MP8179_S175_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_17_MP8179_S176_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_17_MP8179_S176_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_18_MP8179_S177_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_18_MP8179_S177_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_19_MP8179_S178_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_19_MP8179_S178_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_1_MP8179_S160_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_1_MP8179_S160_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_20_MP8179_S179_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_20_MP8179_S179_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_21_MP8179_S180_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_21_MP8179_S180_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_23_MP8179_S181_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_23_MP8179_S181_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_24_MP8179_S182_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_24_MP8179_S182_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_2_MP8179_S161_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_2_MP8179_S161_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_3_MP8179_S162_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_4_MP8179_S163_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_3_MP8179_S162_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_4_MP8179_S163_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_5_MP8179_S164_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_6_MP8179_S165_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_5_MP8179_S164_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_6_MP8179_S165_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_7_MP8179_S166_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_7_MP8179_S166_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_8_MP8179_S167_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_8_MP8179_S167_R2_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_9_MP8179_S168_R1_001.fastq.gz...
Copying gs://transfer-amlproject/slamseq_inhibitor_spikeins/20200827_9_MP8179_S168_R2_001.fastq.gz...
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R2_001.fastq.gz component 0
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R2_001.fastq.gz component 1
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R2_001.fastq.gz component 2
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R2_001.fastq.gz component 3
Resuming download for ../../data/slamseqMax/fastqs/20200827_2_MP8179_S161_R1_001.fastq.gz component 0
Resuming download for ../../data/slamseqMax/fastqs/20200827_2_MP8179_S161_R1_001.fastq.gz component 1
Resuming download for ../../data/slamseqMax/fastqs/20200827_2_MP8179_S161_R1_001.fastq.gz component 2
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R1_001.fastq.gz component 0
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R1_001.fastq.gz component 2
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R1_001.fastq.gz component 1
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R1_001.fastq.gz component 0
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R1_001.fastq.gz component 1
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R1_001.fastq.gz component 2
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R2_001.fastq.gz component 0
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R2_001.fastq.gz component 1
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R2_001.fastq.gz component 2
Resuming download for ../../data/slamseqMax/fastqs/20200827_2_MP8179_S161_R1_001.fastq.gz component 3
Resuming download for ../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R1_001.fastq.gz component 3
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R1_001.fastq.gz component 3
Resuming download for ../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R2_001.fastq.gz component 3
- [46/46 files][165.1 GiB/165.1 GiB] 100% Done 177.8 MiB/s ETA 00:00:00         
Operation completed over 46 objects/165.1 GiB.                                   
In [21]:
ls ../../data/$project/fastqs
mr193-MV411-MYBi_30m-r1_R1_001.fastq.gz_trimming_report.txt
mr193-MV411-MYBi_30m-r1_R1_001_unpaired_1.fq.gz
mr193-MV411-MYBi_30m-r1_R1_001_val_1.fq.gz
mr193-MV411-MYBi_30m-r1_R2_001.fastq.gz_trimming_report.txt
mr193-MV411-MYBi_30m-r1_R2_001_unpaired_2.fq.gz
mr193-MV411-MYBi_30m-r1_R2_001_val_2.fq.gz
mr194-MV411-MYBi_30m-r2_R1_001.fastq.gz_trimming_report.txt
mr194-MV411-MYBi_30m-r2_R1_001_unpaired_1.fq.gz
mr194-MV411-MYBi_30m-r2_R1_001_val_1.fq.gz
mr194-MV411-MYBi_30m-r2_R2_001.fastq.gz_trimming_report.txt
mr194-MV411-MYBi_30m-r2_R2_001_unpaired_2.fq.gz
mr194-MV411-MYBi_30m-r2_R2_001_val_2.fq.gz
mr195-MV411-MYBi_30m-r3_R1_001.fastq.gz_trimming_report.txt
mr195-MV411-MYBi_30m-r3_R1_001_unpaired_1.fq.gz
mr195-MV411-MYBi_30m-r3_R1_001_val_1.fq.gz
mr195-MV411-MYBi_30m-r3_R2_001.fastq.gz_trimming_report.txt
mr195-MV411-MYBi_30m-r3_R2_001_unpaired_2.fq.gz
mr195-MV411-MYBi_30m-r3_R2_001_val_2.fq.gz
mr196-MV411-MYBi_30m-r4_R1_001.fastq.gz_trimming_report.txt
mr196-MV411-MYBi_30m-r4_R1_001_unpaired_1.fq.gz
mr196-MV411-MYBi_30m-r4_R1_001_val_1.fq.gz
mr196-MV411-MYBi_30m-r4_R2_001.fastq.gz_trimming_report.txt
mr196-MV411-MYBi_30m-r4_R2_001_unpaired_2.fq.gz
mr196-MV411-MYBi_30m-r4_R2_001_val_2.fq.gz
mr197-MV411-PBS_30m-r1_R1_001.fastq.gz_trimming_report.txt
mr197-MV411-PBS_30m-r1_R1_001_unpaired_1.fq.gz
mr197-MV411-PBS_30m-r1_R1_001_val_1.fq.gz
mr197-MV411-PBS_30m-r1_R2_001.fastq.gz_trimming_report.txt
mr197-MV411-PBS_30m-r1_R2_001_unpaired_2.fq.gz
mr197-MV411-PBS_30m-r1_R2_001_val_2.fq.gz
mr198-MV411-PBS_30m-r2_R1_001.fastq.gz_trimming_report.txt
mr198-MV411-PBS_30m-r2_R1_001_unpaired_1.fq.gz
mr198-MV411-PBS_30m-r2_R1_001_val_1.fq.gz
mr198-MV411-PBS_30m-r2_R2_001.fastq.gz_trimming_report.txt
mr198-MV411-PBS_30m-r2_R2_001_unpaired_2.fq.gz
mr198-MV411-PBS_30m-r2_R2_001_val_2.fq.gz
mr199-MV411-PBS_30m-r3_R1_001.fastq.gz_trimming_report.txt
mr199-MV411-PBS_30m-r3_R1_001_unpaired_1.fq.gz
mr199-MV411-PBS_30m-r3_R1_001_val_1.fq.gz
mr199-MV411-PBS_30m-r3_R2_001.fastq.gz_trimming_report.txt
mr199-MV411-PBS_30m-r3_R2_001_unpaired_2.fq.gz
mr199-MV411-PBS_30m-r3_R2_001_val_2.fq.gz
mr200-MV411-PBS_30m-r4_R1_001.fastq.gz_trimming_report.txt
mr200-MV411-PBS_30m-r4_R1_001_unpaired_1.fq.gz
mr200-MV411-PBS_30m-r4_R1_001_val_1.fq.gz
mr200-MV411-PBS_30m-r4_R2_001.fastq.gz_trimming_report.txt
mr200-MV411-PBS_30m-r4_R2_001_unpaired_2.fq.gz
mr200-MV411-PBS_30m-r4_R2_001_val_2.fq.gz
mr201-MV411-MYBi_6h-r1_R1_001.fastq.gz_trimming_report.txt
mr201-MV411-MYBi_6h-r1_R1_001_unpaired_1.fq.gz
mr201-MV411-MYBi_6h-r1_R1_001_val_1.fq.gz
mr201-MV411-MYBi_6h-r1_R2_001.fastq.gz_trimming_report.txt
mr201-MV411-MYBi_6h-r1_R2_001_unpaired_2.fq.gz
mr201-MV411-MYBi_6h-r1_R2_001_val_2.fq.gz
mr202-MV411-MYBi_6h-r2_R1_001.fastq.gz_trimming_report.txt
mr202-MV411-MYBi_6h-r2_R1_001_unpaired_1.fq.gz
mr202-MV411-MYBi_6h-r2_R1_001_val_1.fq.gz
mr202-MV411-MYBi_6h-r2_R2_001.fastq.gz_trimming_report.txt
mr202-MV411-MYBi_6h-r2_R2_001_unpaired_2.fq.gz
mr202-MV411-MYBi_6h-r2_R2_001_val_2.fq.gz
mr203-MV411-MYBi_6h-r3_R1_001.fastq.gz_trimming_report.txt
mr203-MV411-MYBi_6h-r3_R1_001_unpaired_1.fq.gz
mr203-MV411-MYBi_6h-r3_R1_001_val_1.fq.gz
mr203-MV411-MYBi_6h-r3_R2_001.fastq.gz_trimming_report.txt
mr203-MV411-MYBi_6h-r3_R2_001_unpaired_2.fq.gz
mr203-MV411-MYBi_6h-r3_R2_001_val_2.fq.gz
mr204-MV411-MYBi_6h-r4_R1_001.fastq.gz_trimming_report.txt
mr204-MV411-MYBi_6h-r4_R1_001_unpaired_1.fq.gz
mr204-MV411-MYBi_6h-r4_R1_001_val_1.fq.gz
mr204-MV411-MYBi_6h-r4_R2_001.fastq.gz_trimming_report.txt
mr204-MV411-MYBi_6h-r4_R2_001_unpaired_2.fq.gz
mr204-MV411-MYBi_6h-r4_R2_001_val_2.fq.gz
mr205-MV411-PBS_6h-r1_R1_001.fastq.gz_trimming_report.txt
mr205-MV411-PBS_6h-r1_R1_001_unpaired_1.fq.gz
mr205-MV411-PBS_6h-r1_R1_001_val_1.fq.gz
mr205-MV411-PBS_6h-r1_R2_001.fastq.gz_trimming_report.txt
mr205-MV411-PBS_6h-r1_R2_001_unpaired_2.fq.gz
mr205-MV411-PBS_6h-r1_R2_001_val_2.fq.gz
mr206-MV411-PBS_6h-r2_R1_001.fastq.gz_trimming_report.txt
mr206-MV411-PBS_6h-r2_R1_001_unpaired_1.fq.gz
mr206-MV411-PBS_6h-r2_R1_001_val_1.fq.gz
mr206-MV411-PBS_6h-r2_R2_001.fastq.gz_trimming_report.txt
mr206-MV411-PBS_6h-r2_R2_001_unpaired_2.fq.gz
mr206-MV411-PBS_6h-r2_R2_001_val_2.fq.gz
mr207-MV411-PBS_6h-r3_R1_001.fastq.gz_trimming_report.txt
mr207-MV411-PBS_6h-r3_R1_001_unpaired_1.fq.gz
mr207-MV411-PBS_6h-r3_R1_001_val_1.fq.gz
mr207-MV411-PBS_6h-r3_R2_001.fastq.gz_trimming_report.txt
mr207-MV411-PBS_6h-r3_R2_001_unpaired_2.fq.gz
mr207-MV411-PBS_6h-r3_R2_001_val_2.fq.gz
mr208-MV411-MS2-r1_R1_001.fastq.gz_trimming_report.txt
mr208-MV411-MS2-r1_R1_001_unpaired_1.fq.gz
mr208-MV411-MS2-r1_R1_001_val_1.fq.gz
mr208-MV411-MS2-r1_R2_001.fastq.gz_trimming_report.txt
mr208-MV411-MS2-r1_R2_001_unpaired_2.fq.gz
mr208-MV411-MS2-r1_R2_001_val_2.fq.gz
mr209-MV411-MS2-r2_R1_001.fastq.gz_trimming_report.txt
mr209-MV411-MS2-r2_R1_001_unpaired_1.fq.gz
mr209-MV411-MS2-r2_R1_001_val_1.fq.gz
mr209-MV411-MS2-r2_R2_001.fastq.gz_trimming_report.txt
mr209-MV411-MS2-r2_R2_001_unpaired_2.fq.gz
mr209-MV411-MS2-r2_R2_001_val_2.fq.gz
mr210-MV411-MS2-r3_R1_001.fastq.gz_trimming_report.txt
mr210-MV411-MS2-r3_R1_001_unpaired_1.fq.gz
mr210-MV411-MS2-r3_R1_001_val_1.fq.gz
mr210-MV411-MS2-r3_R2_001.fastq.gz_trimming_report.txt
mr210-MV411-MS2-r3_R2_001_unpaired_2.fq.gz
mr210-MV411-MS2-r3_R2_001_val_2.fq.gz
mr211-MV411-JQ1-r1_R1_001.fastq.gz_trimming_report.txt
mr211-MV411-JQ1-r1_R1_001_unpaired_1.fq.gz
mr211-MV411-JQ1-r1_R1_001_val_1.fq.gz
mr211-MV411-JQ1-r1_R2_001.fastq.gz_trimming_report.txt
mr211-MV411-JQ1-r1_R2_001_unpaired_2.fq.gz
mr211-MV411-JQ1-r1_R2_001_val_2.fq.gz
mr212-MV411-JQ1-r2_R1_001.fastq.gz_trimming_report.txt
mr212-MV411-JQ1-r2_R1_001_unpaired_1.fq.gz
mr212-MV411-JQ1-r2_R1_001_val_1.fq.gz
mr212-MV411-JQ1-r2_R2_001.fastq.gz_trimming_report.txt
mr212-MV411-JQ1-r2_R2_001_unpaired_2.fq.gz
mr212-MV411-JQ1-r2_R2_001_val_2.fq.gz
mr213-MV411-JQ1-r3_R1_001.fastq.gz_trimming_report.txt
mr213-MV411-JQ1-r3_R1_001_unpaired_1.fq.gz
mr213-MV411-JQ1-r3_R1_001_val_1.fq.gz
mr213-MV411-JQ1-r3_R2_001.fastq.gz_trimming_report.txt
mr213-MV411-JQ1-r3_R2_001_unpaired_2.fq.gz
mr213-MV411-JQ1-r3_R2_001_val_2.fq.gz
mr214-MV411-MS2_JQ1-r1_R1_001.fastq.gz_trimming_report.txt
mr214-MV411-MS2_JQ1-r1_R1_001_unpaired_1.fq.gz
mr214-MV411-MS2_JQ1-r1_R1_001_val_1.fq.gz
mr214-MV411-MS2_JQ1-r1_R2_001.fastq.gz_trimming_report.txt
mr214-MV411-MS2_JQ1-r1_R2_001_unpaired_2.fq.gz
mr214-MV411-MS2_JQ1-r1_R2_001_val_2.fq.gz
mr215-MV411-MS2_JQ1-r2_R1_001.fastq.gz_trimming_report.txt
mr215-MV411-MS2_JQ1-r2_R1_001_unpaired_1.fq.gz
mr215-MV411-MS2_JQ1-r2_R1_001_val_1.fq.gz
mr215-MV411-MS2_JQ1-r2_R2_001.fastq.gz_trimming_report.txt
mr215-MV411-MS2_JQ1-r2_R2_001_unpaired_2.fq.gz
mr215-MV411-MS2_JQ1-r2_R2_001_val_2.fq.gz
mr216-MV411-MS2_JQ1-r3_R1_001.fastq.gz_trimming_report.txt
mr216-MV411-MS2_JQ1-r3_R1_001_unpaired_1.fq.gz
mr216-MV411-MS2_JQ1-r3_R1_001_val_1.fq.gz
mr216-MV411-MS2_JQ1-r3_R2_001.fastq.gz_trimming_report.txt
mr216-MV411-MS2_JQ1-r3_R2_001_unpaired_2.fq.gz
mr216-MV411-MS2_JQ1-r3_R2_001_val_2.fq.gz
mr217-MV411-DMSO-r1_R1_001.fastq.gz_trimming_report.txt
mr217-MV411-DMSO-r1_R1_001_unpaired_1.fq.gz
mr217-MV411-DMSO-r1_R1_001_val_1.fq.gz
mr217-MV411-DMSO-r1_R2_001.fastq.gz_trimming_report.txt
mr217-MV411-DMSO-r1_R2_001_unpaired_2.fq.gz
mr217-MV411-DMSO-r1_R2_001_val_2.fq.gz
mr218-MV411-DMSO-r2_R1_001.fastq.gz_trimming_report.txt
mr218-MV411-DMSO-r2_R1_001_unpaired_1.fq.gz
mr218-MV411-DMSO-r2_R1_001_val_1.fq.gz
mr218-MV411-DMSO-r2_R2_001.fastq.gz_trimming_report.txt
mr218-MV411-DMSO-r2_R2_001_unpaired_2.fq.gz
mr218-MV411-DMSO-r2_R2_001_val_2.fq.gz
mr219-MV411-DMSO-r3_R1_001.fastq.gz_trimming_report.txt
mr219-MV411-DMSO-r3_R1_001_unpaired_1.fq.gz
mr219-MV411-DMSO-r3_R1_001_val_1.fq.gz
mr219-MV411-DMSO-r3_R2_001.fastq.gz_trimming_report.txt
mr219-MV411-DMSO-r3_R2_001_unpaired_2.fq.gz
mr219-MV411-DMSO-r3_R2_001_val_2.fq.gz

Running slamdunk

In [ ]:
#if need to download the data from sra
! mkdir ../../data/slam/MYCpaper && cd ../../data/slam/MYCpaper && fastq_dump SRR5806781 && fastq_dump SRR5806783 && fastq_dump SRR5806785 &&
fastq_dump SRR5806780 && fastq_dump SRR5806782 && fastq_dump SRR5806784 && cd -
In [32]:
folder_bams = "../../data/"+project+'/fastqs'
bams = ! ls $folder_bams/*
bams
Out[32]:
['../../data/slamseqMax/fastqs/20200827_10_MP8179_S169_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_10_MP8179_S169_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_11_MP8179_S170_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_11_MP8179_S170_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_12_MP8179_S171_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_12_MP8179_S171_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_13_MP8179_S172_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_13_MP8179_S172_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_14_MP8179_S173_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_14_MP8179_S173_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_15_MP8179_S174_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_15_MP8179_S174_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_16_MP8179_S175_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_16_MP8179_S175_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_17_MP8179_S176_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_17_MP8179_S176_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_18_MP8179_S177_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_18_MP8179_S177_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_19_MP8179_S178_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_19_MP8179_S178_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_1_MP8179_S160_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_1_MP8179_S160_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_20_MP8179_S179_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_20_MP8179_S179_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_21_MP8179_S180_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_21_MP8179_S180_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_23_MP8179_S181_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_23_MP8179_S181_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_24_MP8179_S182_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_24_MP8179_S182_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_2_MP8179_S161_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_2_MP8179_S161_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_3_MP8179_S162_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_4_MP8179_S163_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_5_MP8179_S164_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_5_MP8179_S164_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_6_MP8179_S165_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_6_MP8179_S165_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_7_MP8179_S166_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_7_MP8179_S166_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_8_MP8179_S167_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_8_MP8179_S167_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_9_MP8179_S168_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs/20200827_9_MP8179_S168_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R2_001_val_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R1_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R1_001_unpaired_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R1_001_val_1.fq.gz',
 '../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R2_001.fastq.gz_trimming_report.txt',
 '../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R2_001_unpaired_2.fq.gz',
 '../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R2_001_val_2.fq.gz']
In [31]:
rename = {
"20200707_1_MP8000_S65": "mr193-MV411-MYBi_30m-r1",
"20200707_2_MP8000_S66": "mr194-MV411-MYBi_30m-r2",
"20200707_3_MP8000_S67": "mr195-MV411-MYBi_30m-r3",
"20200707_4_MP8000_S68": "mr196-MV411-MYBi_30m-r4",
"20200707_5_MP8000_S69": "mr197-MV411-PBS_30m-r1",
"20200707_6_MP8000_S70": "mr198-MV411-PBS_30m-r2",
"20200707_7_MP8000_S71": "mr199-MV411-PBS_30m-r3",
"20200707_8_MP8000_S72": "mr200-MV411-PBS_30m-r4",
"20200707_9_MP8000_S73": "mr201-MV411-MYBi_6h-r1",
"20200707_10_MP8000_S74": "mr202-MV411-MYBi_6h-r2",
"20200707_11_MP8000_S75": "mr203-MV411-MYBi_6h-r3",
"20200707_12_MP8000_S76": "mr204-MV411-MYBi_6h-r4",
"20200707_13_MP8000_S77": "mr205-MV411-PBS_6h-r1",
"20200707_14_MP8000_S78": "mr206-MV411-PBS_6h-r2",
"20200707_15_MP8000_S79": "mr207-MV411-PBS_6h-r3",
"20200703_16_MP800_S103": "mr208-MV411-MS2-r1",
"20200703_17_MP800_S104": "mr209-MV411-MS2-r2",
"20200703_18_MP800_S105": "mr210-MV411-MS2-r3",
"20200703_19_MP800_S106": "mr211-MV411-JQ1-r1",
"20200703_20_MP800_S107": "mr212-MV411-JQ1-r2",
"20200703_21_MP800_S108": "mr213-MV411-JQ1-r3",
"20200703_22_MP800_S109": "mr214-MV411-MS2_JQ1-r1",
"20200703_23_MP800_S110": "mr215-MV411-MS2_JQ1-r2",
"20200703_24_MP800_S111": "mr216-MV411-MS2_JQ1-r3",
"20200703_25_MP800_S112": "mr217-MV411-DMSO-r1",
"20200703_26_MP800_S113": "mr218-MV411-DMSO-r2",
"20200703_27_MP800_S114": "mr219-MV411-DMSO-r3",
"20200827_1_MP8179_S160": "mr252-MV411_MEF2D-DMSO_2h-r1",
"20200827_2_MP8179_S161": "mr253-MV411_MEF2D-DMSO_2h-r2",
"20200827_3_MP8179_S162": "mr254-MV411_MEF2D-DMSO_2h-r3",
"20200827_4_MP8179_S163": "mr255-MV411_MEF2D-DMSO_2h-r4",
"20200827_5_MP8179_S164": "mr256-MV411_MEF2D-VHL_2h-r1",
"20200827_6_MP8179_S165": "mr257-MV411_MEF2D-VHL_2h-r2",
"20200827_7_MP8179_S166": "mr258-MV411_MEF2D-VHL_2h-r3",
"20200827_8_MP8179_S167": "mr259-MV411_MEF2D-VHL_2h-r4",
"20200827_9_MP8179_S168": "mr260-MV411_MEF2D-DMSO_24h-r1",
"20200827_10_MP8179_S169": "mr261-MV411_MEF2D-DMSO_24h-r2",
"20200827_11_MP8179_S170": "mr262-MV411_MEF2D-DMSO_24h-r3",
"20200827_12_MP8179_S171": "mr263-MV411_MEF2D-DMSO_24h-r4",
"20200827_13_MP8179_S172": "mr264-MV411_MEF2D-VHL_24h-r1",
"20200827_14_MP8179_S173": "mr265-MV411_MEF2D-VHL_24h-r2",
"20200827_15_MP8179_S174": "mr266-MV411_MEF2D-VHL_24h-r3",
"20200827_16_MP8179_S175": "mr267-MV411_MEF2D-VHL_24h-r4",
"20200827_17_MP8179_S176": "mr268-MV411-PBS_24h-r1",
"20200827_18_MP8179_S177": "mr269-MV411-PBS_24h-r2",
"20200827_19_MP8179_S178": "mr270-MV411-PBS_24h-r3",
"20200827_20_MP8179_S179": "mr271-MV411-PBS_24h-r4",
"20200827_21_MP8179_S180": "mr272-MV411-MYBi_24h-r1",
"20200827_23_MP8179_S181": "mr273-MV411-MYBi_24h-r2",
"20200827_24_MP8179_S182": "mr274-MV411-MYBi_24h-r3",
}
In [34]:
for val in bams:
    ren  = val
    for old, new in rename.items():
        ren = ren.replace(old, new)
    if ren !=val:
        ! mv $val $ren
In [35]:
folder="../../data/"+project
folder_bams = folder+'/fastqs/'
bams = ! ls $folder_bams/*.fastq.gz
bams
Out[35]:
['../../data/slamseqMax/fastqs//mr252-MV411_MEF2D-DMSO_2h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr252-MV411_MEF2D-DMSO_2h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr253-MV411_MEF2D-DMSO_2h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr253-MV411_MEF2D-DMSO_2h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr254-MV411_MEF2D-DMSO_2h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr254-MV411_MEF2D-DMSO_2h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr255-MV411_MEF2D-DMSO_2h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr255-MV411_MEF2D-DMSO_2h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr256-MV411_MEF2D-VHL_2h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr256-MV411_MEF2D-VHL_2h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr257-MV411_MEF2D-VHL_2h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr257-MV411_MEF2D-VHL_2h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr258-MV411_MEF2D-VHL_2h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr258-MV411_MEF2D-VHL_2h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr259-MV411_MEF2D-VHL_2h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr259-MV411_MEF2D-VHL_2h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr260-MV411_MEF2D-DMSO_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr260-MV411_MEF2D-DMSO_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr261-MV411_MEF2D-DMSO_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr261-MV411_MEF2D-DMSO_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr262-MV411_MEF2D-DMSO_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr262-MV411_MEF2D-DMSO_24h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr263-MV411_MEF2D-DMSO_24h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr263-MV411_MEF2D-DMSO_24h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr264-MV411_MEF2D-VHL_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr264-MV411_MEF2D-VHL_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr265-MV411_MEF2D-VHL_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr265-MV411_MEF2D-VHL_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr266-MV411_MEF2D-VHL_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr266-MV411_MEF2D-VHL_24h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr267-MV411_MEF2D-VHL_24h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr267-MV411_MEF2D-VHL_24h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr268-MV411-PBS_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr268-MV411-PBS_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr269-MV411-PBS_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr269-MV411-PBS_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr270-MV411-PBS_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr270-MV411-PBS_24h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr271-MV411-PBS_24h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr271-MV411-PBS_24h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr272-MV411-MYBi_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr272-MV411-MYBi_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr273-MV411-MYBi_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr273-MV411-MYBi_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr274-MV411-MYBi_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr274-MV411-MYBi_24h-r3_R2_001.fastq.gz']
In [4]:
! pip3 install git+https://github.com/jkobject/slamdunk.git --upgrade
# please also install trimgalore and cutadapt
Collecting git+https://github.com/jkobject/slamdunk.git
  Cloning https://github.com/jkobject/slamdunk.git to /tmp/pip-req-build-qa580_ce
Requirement already satisfied, skipping upgrade: joblib>=0.9.4 in /home/jeremie/.local/lib/python3.8/site-packages (from slamdunk==0.4.0) (0.14.1)
Requirement already satisfied, skipping upgrade: pybedtools>=0.6.4 in /home/jeremie/.local/lib/python3.8/site-packages (from slamdunk==0.4.0) (0.8.1)
Requirement already satisfied, skipping upgrade: intervaltree>=2.1.0 in /home/jeremie/.local/lib/python3.8/site-packages (from slamdunk==0.4.0) (3.0.2)
Requirement already satisfied, skipping upgrade: pandas>=0.13.1 in /home/jeremie/.local/lib/python3.8/site-packages (from slamdunk==0.4.0) (1.0.3)
Requirement already satisfied, skipping upgrade: biopython>=1.63 in /home/jeremie/.local/lib/python3.8/site-packages (from slamdunk==0.4.0) (1.77)
Requirement already satisfied, skipping upgrade: pysam>=0.8.3 in /home/jeremie/.local/lib/python3.8/site-packages (from slamdunk==0.4.0) (0.15.4)
Requirement already satisfied, skipping upgrade: Cython>=0.20.1 in /home/jeremie/.local/lib/python3.8/site-packages (from slamdunk==0.4.0) (0.29.17)
Requirement already satisfied, skipping upgrade: six in /home/jeremie/.local/lib/python3.8/site-packages (from pybedtools>=0.6.4->slamdunk==0.4.0) (1.14.0)
Requirement already satisfied, skipping upgrade: sortedcontainers<3.0,>=2.0 in /home/jeremie/.local/lib/python3.8/site-packages (from intervaltree>=2.1.0->slamdunk==0.4.0) (2.2.2)
Requirement already satisfied, skipping upgrade: pytz>=2017.2 in /home/jeremie/.local/lib/python3.8/site-packages (from pandas>=0.13.1->slamdunk==0.4.0) (2020.1)
Requirement already satisfied, skipping upgrade: python-dateutil>=2.6.1 in /home/jeremie/.local/lib/python3.8/site-packages (from pandas>=0.13.1->slamdunk==0.4.0) (2.8.1)
Requirement already satisfied, skipping upgrade: numpy>=1.13.3 in /home/jeremie/.local/lib/python3.8/site-packages (from pandas>=0.13.1->slamdunk==0.4.0) (1.18.4)
Building wheels for collected packages: slamdunk
  Running setup.py bdist_wheel for slamdunk ... done
  Stored in directory: /tmp/pip-ephem-wheel-cache-cggtrlco/wheels/4c/b2/9c/e1153807b1571f6f12ee9761dcf5229ceee161c5c575b631fd
Successfully built slamdunk
Installing collected packages: slamdunk
  Found existing installation: slamdunk 0.4.0
    Uninstalling slamdunk-0.4.0:
      Successfully uninstalled slamdunk-0.4.0
Successfully installed slamdunk-0.4.0
In [36]:
parrun(['../../TrimGalore-0.6.5/trim_galore --paired --cores 4 --retain_unpaired -stringency 3 --illumina '+val1+ ' '+val2+' -o '+folder_bams for val1,val2 in grouped(bams,2)],2)
In [ ]:
rm fastqs/*.fastq.gz
In [23]:
ls -al ../../data/$project/fastqs
total 323740620
drwxr-xr-x 2 jeremie jeremie      20480 Jul 16 23:59 ./
drwxr-xr-x 3 jeremie jeremie       4096 Jul 16 16:48 ../
-rw-r--r-- 1 jeremie jeremie 1972661712 Jul 16 16:09 mr193-MV411-MYBi_30m-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4078 Jul 16 17:28 mr193-MV411-MYBi_30m-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1745221196 Jul 16 17:28 mr193-MV411-MYBi_30m-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 2001846977 Jul 16 16:11 mr193-MV411-MYBi_30m-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4042 Jul 16 18:04 mr193-MV411-MYBi_30m-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1771675421 Jul 16 18:04 mr193-MV411-MYBi_30m-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1883635938 Jul 16 16:11 mr194-MV411-MYBi_30m-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4101 Jul 16 18:03 mr194-MV411-MYBi_30m-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1656441393 Jul 16 18:03 mr194-MV411-MYBi_30m-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1898121444 Jul 16 16:09 mr194-MV411-MYBi_30m-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4064 Jul 16 18:03 mr194-MV411-MYBi_30m-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1668987747 Jul 16 18:03 mr194-MV411-MYBi_30m-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3664144900 Jul 16 16:10 mr195-MV411-MYBi_30m-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4179 Jul 16 18:16 mr195-MV411-MYBi_30m-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3226927282 Jul 16 18:16 mr195-MV411-MYBi_30m-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3716451047 Jul 16 16:10 mr195-MV411-MYBi_30m-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4149 Jul 16 18:17 mr195-MV411-MYBi_30m-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3273624821 Jul 16 18:17 mr195-MV411-MYBi_30m-r3_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1752447342 Jul 16 16:09 mr196-MV411-MYBi_30m-r4_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4123 Jul 16 18:02 mr196-MV411-MYBi_30m-r4_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1530559903 Jul 16 18:02 mr196-MV411-MYBi_30m-r4_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1772529030 Jul 16 16:09 mr196-MV411-MYBi_30m-r4_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4075 Jul 16 18:39 mr196-MV411-MYBi_30m-r4_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1553594531 Jul 16 18:39 mr196-MV411-MYBi_30m-r4_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 2613576581 Jul 16 16:11 mr197-MV411-PBS_30m-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3987 Jul 16 18:47 mr197-MV411-PBS_30m-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2326678410 Jul 16 18:47 mr197-MV411-PBS_30m-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 2630133074 Jul 16 16:10 mr197-MV411-PBS_30m-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3976 Jul 16 18:48 mr197-MV411-PBS_30m-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2341617043 Jul 16 18:48 mr197-MV411-PBS_30m-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3351245240 Jul 16 16:10 mr198-MV411-PBS_30m-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4147 Jul 16 18:53 mr198-MV411-PBS_30m-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2957225726 Jul 16 18:53 mr198-MV411-PBS_30m-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3373272401 Jul 16 16:11 mr198-MV411-PBS_30m-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4120 Jul 16 18:53 mr198-MV411-PBS_30m-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2973225065 Jul 16 18:53 mr198-MV411-PBS_30m-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1960596780 Jul 16 16:11 mr199-MV411-PBS_30m-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4110 Jul 16 18:41 mr199-MV411-PBS_30m-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1725990637 Jul 16 18:41 mr199-MV411-PBS_30m-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1979110852 Jul 16 16:10 mr199-MV411-PBS_30m-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4065 Jul 16 19:19 mr199-MV411-PBS_30m-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1742107228 Jul 16 19:19 mr199-MV411-PBS_30m-r3_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 2812669024 Jul 16 16:11 mr200-MV411-PBS_30m-r4_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4152 Jul 16 19:29 mr200-MV411-PBS_30m-r4_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2476347201 Jul 16 19:29 mr200-MV411-PBS_30m-r4_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 2815436494 Jul 16 16:11 mr200-MV411-PBS_30m-r4_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4137 Jul 16 19:29 mr200-MV411-PBS_30m-r4_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2480425633 Jul 16 19:29 mr200-MV411-PBS_30m-r4_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1640869794 Jul 16 16:11 mr201-MV411-MYBi_6h-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3981 Jul 16 19:16 mr201-MV411-MYBi_6h-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1441679301 Jul 16 19:16 mr201-MV411-MYBi_6h-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1687581392 Jul 16 16:10 mr201-MV411-MYBi_6h-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3978 Jul 16 19:17 mr201-MV411-MYBi_6h-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1487580959 Jul 16 19:17 mr201-MV411-MYBi_6h-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1802713797 Jul 16 16:05 mr202-MV411-MYBi_6h-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4021 Jul 16 19:18 mr202-MV411-MYBi_6h-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1579927411 Jul 16 19:18 mr202-MV411-MYBi_6h-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1818642533 Jul 16 16:06 mr202-MV411-MYBi_6h-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4001 Jul 16 19:58 mr202-MV411-MYBi_6h-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1595008850 Jul 16 19:58 mr202-MV411-MYBi_6h-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1388870538 Jul 16 16:07 mr203-MV411-MYBi_6h-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3973 Jul 16 19:55 mr203-MV411-MYBi_6h-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1222904350 Jul 16 19:55 mr203-MV411-MYBi_6h-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1393817218 Jul 16 16:10 mr203-MV411-MYBi_6h-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3943 Jul 16 19:55 mr203-MV411-MYBi_6h-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1229376298 Jul 16 19:55 mr203-MV411-MYBi_6h-r3_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1405742865 Jul 16 16:05 mr204-MV411-MYBi_6h-r4_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4080 Jul 16 19:55 mr204-MV411-MYBi_6h-r4_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1220634069 Jul 16 19:55 mr204-MV411-MYBi_6h-r4_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1428450634 Jul 16 16:03 mr204-MV411-MYBi_6h-r4_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4036 Jul 16 19:55 mr204-MV411-MYBi_6h-r4_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1248721580 Jul 16 19:55 mr204-MV411-MYBi_6h-r4_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1723738018 Jul 16 16:08 mr205-MV411-PBS_6h-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4017 Jul 16 19:58 mr205-MV411-PBS_6h-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1525341762 Jul 16 19:58 mr205-MV411-PBS_6h-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1738665340 Jul 16 16:06 mr205-MV411-PBS_6h-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3996 Jul 16 20:18 mr205-MV411-PBS_6h-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1539009328 Jul 16 20:18 mr205-MV411-PBS_6h-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1935183307 Jul 16 16:04 mr206-MV411-PBS_6h-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4094 Jul 16 20:20 mr206-MV411-PBS_6h-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1698865919 Jul 16 20:20 mr206-MV411-PBS_6h-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1938026916 Jul 16 16:08 mr206-MV411-PBS_6h-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4060 Jul 16 20:20 mr206-MV411-PBS_6h-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1702339869 Jul 16 20:20 mr206-MV411-PBS_6h-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1793762688 Jul 16 16:07 mr207-MV411-PBS_6h-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4033 Jul 16 20:19 mr207-MV411-PBS_6h-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1586015735 Jul 16 20:19 mr207-MV411-PBS_6h-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 1813410492 Jul 16 16:04 mr207-MV411-PBS_6h-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4020 Jul 16 20:19 mr207-MV411-PBS_6h-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 1603512570 Jul 16 20:19 mr207-MV411-PBS_6h-r3_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5221458520 Jul 16 16:06 mr208-MV411-MS2-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4075 Jul 16 20:42 mr208-MV411-MS2-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4623601516 Jul 16 20:42 mr208-MV411-MS2-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5504666780 Jul 16 16:09 mr208-MV411-MS2-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4067 Jul 16 21:40 mr208-MV411-MS2-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4890310087 Jul 16 21:40 mr208-MV411-MS2-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3613939790 Jul 16 16:04 mr209-MV411-MS2-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4082 Jul 16 21:25 mr209-MV411-MS2-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3183551639 Jul 16 21:25 mr209-MV411-MS2-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3725862188 Jul 16 16:05 mr209-MV411-MS2-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4049 Jul 16 21:26 mr209-MV411-MS2-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3288974634 Jul 16 21:26 mr209-MV411-MS2-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5605534301 Jul 16 16:11 mr210-MV411-MS2-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4134 Jul 16 21:41 mr210-MV411-MS2-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4956550926 Jul 16 21:41 mr210-MV411-MS2-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5746216216 Jul 16 16:05 mr210-MV411-MS2-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4123 Jul 16 21:42 mr210-MV411-MS2-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 5085018818 Jul 16 21:42 mr210-MV411-MS2-r3_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4636072209 Jul 16 16:07 mr211-MV411-JQ1-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4184 Jul 16 21:34 mr211-MV411-JQ1-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4086164269 Jul 16 21:34 mr211-MV411-JQ1-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4801855817 Jul 16 16:08 mr211-MV411-JQ1-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4150 Jul 16 22:53 mr211-MV411-JQ1-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4241004493 Jul 16 22:53 mr211-MV411-JQ1-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3945710281 Jul 16 16:06 mr212-MV411-JQ1-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4189 Jul 16 22:46 mr212-MV411-JQ1-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3461066842 Jul 16 22:46 mr212-MV411-JQ1-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3996185748 Jul 16 16:08 mr212-MV411-JQ1-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4144 Jul 16 22:47 mr212-MV411-JQ1-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3519529968 Jul 16 22:47 mr212-MV411-JQ1-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4615295045 Jul 16 16:08 mr213-MV411-JQ1-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4169 Jul 16 22:52 mr213-MV411-JQ1-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4065121374 Jul 16 22:52 mr213-MV411-JQ1-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4698448026 Jul 16 16:06 mr213-MV411-JQ1-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4142 Jul 16 22:53 mr213-MV411-JQ1-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4143911322 Jul 16 22:53 mr213-MV411-JQ1-r3_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5192687737 Jul 16 16:11 mr214-MV411-MS2_JQ1-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4193 Jul 16 22:56 mr214-MV411-MS2_JQ1-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4576147106 Jul 16 22:56 mr214-MV411-MS2_JQ1-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5315271182 Jul 16 16:06 mr214-MV411-MS2_JQ1-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4157 Jul 16 23:56 mr214-MV411-MS2_JQ1-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4684702188 Jul 16 23:56 mr214-MV411-MS2_JQ1-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5509754689 Jul 16 16:09 mr215-MV411-MS2_JQ1-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4238 Jul 16 23:58 mr215-MV411-MS2_JQ1-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4835138491 Jul 16 23:58 mr215-MV411-MS2_JQ1-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5741983634 Jul 16 16:09 mr215-MV411-MS2_JQ1-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4211 Jul 16 23:59 mr215-MV411-MS2_JQ1-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 5044583239 Jul 16 23:59 mr215-MV411-MS2_JQ1-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5589321931 Jul 16 16:06 mr216-MV411-MS2_JQ1-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4172 Jul 16 23:58 mr216-MV411-MS2_JQ1-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4936956685 Jul 16 23:58 mr216-MV411-MS2_JQ1-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 5658383246 Jul 16 16:08 mr216-MV411-MS2_JQ1-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4141 Jul 16 23:59 mr216-MV411-MS2_JQ1-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 5002806305 Jul 16 23:59 mr216-MV411-MS2_JQ1-r3_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4051640144 Jul 16 16:09 mr217-MV411-DMSO-r1_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4047 Jul 16 23:44 mr217-MV411-DMSO-r1_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3593376280 Jul 16 23:44 mr217-MV411-DMSO-r1_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4194658762 Jul 16 16:06 mr217-MV411-DMSO-r1_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4026 Jul 17 00:39 mr217-MV411-DMSO-r1_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3728280128 Jul 17 00:39 mr217-MV411-DMSO-r1_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4375154174 Jul 16 16:07 mr218-MV411-DMSO-r2_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4100 Jul 17 00:40 mr218-MV411-DMSO-r2_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 3864291280 Jul 17 00:40 mr218-MV411-DMSO-r2_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 4564711176 Jul 16 16:06 mr218-MV411-DMSO-r2_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       4076 Jul 17 00:42 mr218-MV411-DMSO-r2_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 4042600721 Jul 17 00:42 mr218-MV411-DMSO-r2_R2_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3021404797 Jul 16 16:09 mr219-MV411-DMSO-r3_R1_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3984 Jul 17 00:30 mr219-MV411-DMSO-r3_R1_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2676601777 Jul 17 00:30 mr219-MV411-DMSO-r3_R1_001_trimmed.fq.gz
-rw-r--r-- 1 jeremie jeremie 3081595402 Jul 16 16:07 mr219-MV411-DMSO-r3_R2_001.fastq.gz
-rw-r--r-- 1 jeremie jeremie       3968 Jul 17 00:31 mr219-MV411-DMSO-r3_R2_001.fastq.gz_trimming_report.txt
-rw-r--r-- 1 jeremie jeremie 2732365180 Jul 17 00:31 mr219-MV411-DMSO-r3_R2_001_trimmed.fq.gz
In [37]:
# using an ERCC ref genome (you can just append ERCC fasta to the hg38 fasta)
refgenome="../../data/ref/Homo_sapiens_assembly38_ERCC92.fasta"
In [44]:
bams
Out[44]:
['../../data/slamseqMax/fastqs//mr252-MV411_MEF2D-DMSO_2h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr252-MV411_MEF2D-DMSO_2h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr253-MV411_MEF2D-DMSO_2h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr253-MV411_MEF2D-DMSO_2h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr254-MV411_MEF2D-DMSO_2h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr254-MV411_MEF2D-DMSO_2h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr255-MV411_MEF2D-DMSO_2h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr255-MV411_MEF2D-DMSO_2h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr256-MV411_MEF2D-VHL_2h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr256-MV411_MEF2D-VHL_2h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr257-MV411_MEF2D-VHL_2h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr257-MV411_MEF2D-VHL_2h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr258-MV411_MEF2D-VHL_2h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr258-MV411_MEF2D-VHL_2h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr259-MV411_MEF2D-VHL_2h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr259-MV411_MEF2D-VHL_2h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr260-MV411_MEF2D-DMSO_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr260-MV411_MEF2D-DMSO_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr261-MV411_MEF2D-DMSO_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr261-MV411_MEF2D-DMSO_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr262-MV411_MEF2D-DMSO_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr262-MV411_MEF2D-DMSO_24h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr263-MV411_MEF2D-DMSO_24h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr263-MV411_MEF2D-DMSO_24h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr264-MV411_MEF2D-VHL_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr264-MV411_MEF2D-VHL_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr265-MV411_MEF2D-VHL_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr265-MV411_MEF2D-VHL_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr266-MV411_MEF2D-VHL_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr266-MV411_MEF2D-VHL_24h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr267-MV411_MEF2D-VHL_24h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr267-MV411_MEF2D-VHL_24h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr268-MV411-PBS_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr268-MV411-PBS_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr269-MV411-PBS_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr269-MV411-PBS_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr270-MV411-PBS_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr270-MV411-PBS_24h-r3_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr271-MV411-PBS_24h-r4_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr271-MV411-PBS_24h-r4_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr272-MV411-MYBi_24h-r1_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr272-MV411-MYBi_24h-r1_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr273-MV411-MYBi_24h-r2_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr273-MV411-MYBi_24h-r2_R2_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr274-MV411-MYBi_24h-r3_R1_001.fastq.gz',
 '../../data/slamseqMax/fastqs//mr274-MV411-MYBi_24h-r3_R2_001.fastq.gz']
In [46]:
# we are doing it paired end
parrun(['slamdunk all -r '+refgenome+' -b ../data/Muhar_Slamseq/GSE100708_hg38_refseq_062016_ensemblv84_3UTR.bed \
    -o ../../data/'+project+'/res/ -t 8 -c 2 -N '+val1.split('/')[-1].split('_R')[0]+' '+val1.replace('.fastq.gz','_val_1.fq.gz')+" "+val2.replace('.fastq.gz','_val_2.fq.gz') for val1,val2 in grouped(bams[4:],2)], 2)
In [47]:
ls ../../data/$project/res/count/*.tsv
../../data/slamseqMax/res/count/mr252-MV411_MEF2D-DMSO_2h-r1_tcount.tsv
../../data/slamseqMax/res/count/mr253-MV411_MEF2D-DMSO_2h-r2_tcount.tsv
../../data/slamseqMax/res/count/mr254-MV411_MEF2D-DMSO_2h-r3_tcount.tsv
../../data/slamseqMax/res/count/mr255-MV411_MEF2D-DMSO_2h-r4_tcount.tsv
../../data/slamseqMax/res/count/mr256-MV411_MEF2D-VHL_2h-r1_tcount.tsv
../../data/slamseqMax/res/count/mr257-MV411_MEF2D-VHL_2h-r2_tcount.tsv
../../data/slamseqMax/res/count/mr258-MV411_MEF2D-VHL_2h-r3_tcount.tsv
../../data/slamseqMax/res/count/mr259-MV411_MEF2D-VHL_2h-r4_tcount.tsv
../../data/slamseqMax/res/count/mr260-MV411_MEF2D-DMSO_24h-r1_tcount.tsv
../../data/slamseqMax/res/count/mr261-MV411_MEF2D-DMSO_24h-r2_tcount.tsv
../../data/slamseqMax/res/count/mr262-MV411_MEF2D-DMSO_24h-r3_tcount.tsv
../../data/slamseqMax/res/count/mr263-MV411_MEF2D-DMSO_24h-r4_tcount.tsv
../../data/slamseqMax/res/count/mr264-MV411_MEF2D-VHL_24h-r1_tcount.tsv
../../data/slamseqMax/res/count/mr265-MV411_MEF2D-VHL_24h-r2_tcount.tsv
../../data/slamseqMax/res/count/mr266-MV411_MEF2D-VHL_24h-r3_tcount.tsv
../../data/slamseqMax/res/count/mr267-MV411_MEF2D-VHL_24h-r4_tcount.tsv
../../data/slamseqMax/res/count/mr268-MV411-PBS_24h-r1_tcount.tsv
../../data/slamseqMax/res/count/mr269-MV411-PBS_24h-r2_tcount.tsv
../../data/slamseqMax/res/count/mr270-MV411-PBS_24h-r3_tcount.tsv
../../data/slamseqMax/res/count/mr271-MV411-PBS_24h-r4_tcount.tsv
../../data/slamseqMax/res/count/mr272-MV411-MYBi_24h-r1_tcount.tsv
../../data/slamseqMax/res/count/mr273-MV411-MYBi_24h-r2_tcount.tsv
../../data/slamseqMax/res/count/mr274-MV411-MYBi_24h-r3_tcount.tsv

we first need to recreate out RNA matrix from slamdunk's tcount files

In [358]:
!gsutil -m cp -r ../../data/$project/* gs://amlproject/RNA/slamseq_iBet_max/
Copying file://../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
==> NOTE: You are uploading one or more large file(s), which would run          
significantly faster if you enable parallel composite uploads. This
feature can be enabled by editing the
"parallel_composite_upload_threshold" value in your .boto
configuration file. However, note that if you do this large files will
be uploaded as `composite objects
<https://cloud.google.com/storage/docs/composite-objects>`_,which
means that any user who downloads such objects will need to have a
compiled crcmod installed (see "gsutil help crcmod"). This is because
without a compiled crcmod, computing checksums on composite objects is
so slow that gsutil disables downloads of composite objects.

Copying file://../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr211-MV411-JQ1-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr198-MV411-PBS_30m-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr215-MV411-MS2_JQ1-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr206-MV411-PBS_6h-r2_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr208-MV411-MS2-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr207-MV411-PBS_6h-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr212-MV411-JQ1-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr199-MV411-PBS_30m-r3_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr193-MV411-MYBi_30m-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr205-MV411-PBS_6h-r1_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr214-MV411-MS2_JQ1-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr209-MV411-MS2-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr197-MV411-PBS_30m-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr201-MV411-MYBi_6h-r1_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr217-MV411-DMSO-r1_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr200-MV411-PBS_30m-r4_R2_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr203-MV411-MYBi_6h-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr202-MV411-MYBi_6h-r2_R1_001.fastq.gz_trimming_report.txt [Content-Type=text/plain]...
Copying file://../../data/slamseqMax/fastqs/mr219-MV411-DMSO-r3_R2_001_unpaired_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr210-MV411-MS2-r3_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr218-MV411-DMSO-r2_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr216-MV411-MS2_JQ1-r3_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr195-MV411-MYBi_30m-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr194-MV411-MYBi_30m-r2_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr204-MV411-MYBi_6h-r4_R1_001_val_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr213-MV411-JQ1-r3_R1_001_unpaired_1.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/fastqs/mr196-MV411-MYBi_30m-r4_R2_001_val_2.fq.gz [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr213-MV411-JQ1-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr193-MV411-MYBi_30m-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr195-MV411-MYBi_30m-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr211-MV411-JQ1-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr217-MV411-DMSO-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr196-MV411-MYBi_30m-r4_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr215-MV411-MS2_JQ1-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr203-MV411-MYBi_6h-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr194-MV411-MYBi_30m-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr210-MV411-MS2-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr202-MV411-MYBi_6h-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr204-MV411-MYBi_6h-r4_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr203-MV411-MYBi_6h-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr197-MV411-PBS_30m-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr210-MV411-MS2-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr218-MV411-DMSO-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr201-MV411-MYBi_6h-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr206-MV411-PBS_6h-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr199-MV411-PBS_30m-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr196-MV411-MYBi_30m-r4_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr213-MV411-JQ1-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr214-MV411-MS2_JQ1-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr212-MV411-JQ1-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr211-MV411-JQ1-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr207-MV411-PBS_6h-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr202-MV411-MYBi_6h-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr206-MV411-PBS_6h-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr207-MV411-PBS_6h-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr194-MV411-MYBi_30m-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr216-MV411-MS2_JQ1-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr198-MV411-PBS_30m-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr200-MV411-PBS_30m-r4_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr194-MV411-MYBi_30m-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr206-MV411-PBS_6h-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr195-MV411-MYBi_30m-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr201-MV411-MYBi_6h-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr208-MV411-MS2-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr215-MV411-MS2_JQ1-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr198-MV411-PBS_30m-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr210-MV411-MS2-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr205-MV411-PBS_6h-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr195-MV411-MYBi_30m-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr193-MV411-MYBi_30m-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr213-MV411-JQ1-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr207-MV411-PBS_6h-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr219-MV411-DMSO-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr218-MV411-DMSO-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr219-MV411-DMSO-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr193-MV411-MYBi_30m-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr199-MV411-PBS_30m-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr211-MV411-JQ1-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr218-MV411-DMSO-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr202-MV411-MYBi_6h-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr198-MV411-PBS_30m-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr209-MV411-MS2-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr197-MV411-PBS_30m-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr212-MV411-JQ1-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr210-MV411-MS2-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr205-MV411-PBS_6h-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr212-MV411-JQ1-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr219-MV411-DMSO-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr212-MV411-JQ1-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr211-MV411-JQ1-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr204-MV411-MYBi_6h-r4_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr217-MV411-DMSO-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr215-MV411-MS2_JQ1-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr214-MV411-MS2_JQ1-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr195-MV411-MYBi_30m-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr197-MV411-PBS_30m-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr214-MV411-MS2_JQ1-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr204-MV411-MYBi_6h-r4_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr200-MV411-PBS_30m-r4_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr200-MV411-PBS_30m-r4_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr201-MV411-MYBi_6h-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr217-MV411-DMSO-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr196-MV411-MYBi_30m-r4_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr202-MV411-MYBi_6h-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr213-MV411-JQ1-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr203-MV411-MYBi_6h-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr215-MV411-MS2_JQ1-r2_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr208-MV411-MS2-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr214-MV411-MS2_JQ1-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr206-MV411-PBS_6h-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr205-MV411-PBS_6h-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr216-MV411-MS2_JQ1-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr209-MV411-MS2-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr216-MV411-MS2_JQ1-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr209-MV411-MS2-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr193-MV411-MYBi_30m-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr207-MV411-PBS_6h-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr217-MV411-DMSO-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr201-MV411-MYBi_6h-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr208-MV411-MS2-r1_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr218-MV411-DMSO-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr205-MV411-PBS_6h-r1_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr196-MV411-MYBi_30m-r4_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr219-MV411-DMSO-r3_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr216-MV411-MS2_JQ1-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr199-MV411-PBS_30m-r3_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr208-MV411-MS2-r1_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr198-MV411-PBS_30m-r2_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr197-MV411-PBS_30m-r1_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr194-MV411-MYBi_30m-r2_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr209-MV411-MS2-r2_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr199-MV411-PBS_30m-r3_tcount_mins.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr204-MV411-MYBi_6h-r4_tcount.tsv [Content-Type=text/tab-separated-values]...
Copying file://../../data/slamseqMax/res/count/mr203-MV411-MYBi_6h-r3_tcount.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/count/mr200-MV411-PBS_30m-r4_tcount_plus.bedgraph [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr215-MV411-MS2_JQ1-r2_slamdunk_mapped.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr216-MV411-MS2_JQ1-r3_slamdunk_mapped.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr218-MV411-DMSO-r2_slamdunk_mapped.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr219-MV411-DMSO-r3_slamdunk_mapped.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr216-MV411-MS2_JQ1-r3_slamdunk_mapped.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr218-MV411-DMSO-r2_slamdunk_mapped.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr217-MV411-DMSO-r1_slamdunk_mapped.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr217-MV411-DMSO-r1_slamdunk_mapped.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr215-MV411-MS2_JQ1-r2_slamdunk_mapped.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/map/mr219-MV411-DMSO-r3_slamdunk_mapped.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr211-MV411-JQ1-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr214-MV411-MS2_JQ1-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr206-MV411-PBS_6h-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr193-MV411-MYBi_30m-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr210-MV411-MS2-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr213-MV411-JQ1-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr203-MV411-MYBi_6h-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr217-MV411-DMSO-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr200-MV411-PBS_30m-r4_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr195-MV411-MYBi_30m-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr214-MV411-MS2_JQ1-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr218-MV411-DMSO-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr201-MV411-MYBi_6h-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr210-MV411-MS2-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr197-MV411-PBS_30m-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr217-MV411-DMSO-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr208-MV411-MS2-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr201-MV411-MYBi_6h-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr202-MV411-MYBi_6h-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr193-MV411-MYBi_30m-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr213-MV411-JQ1-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr216-MV411-MS2_JQ1-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr211-MV411-JQ1-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr207-MV411-PBS_6h-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr208-MV411-MS2-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr216-MV411-MS2_JQ1-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr212-MV411-JQ1-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr196-MV411-MYBi_30m-r4_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr196-MV411-MYBi_30m-r4_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr209-MV411-MS2-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr197-MV411-PBS_30m-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr198-MV411-PBS_30m-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr200-MV411-PBS_30m-r4_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr199-MV411-PBS_30m-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr199-MV411-PBS_30m-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr205-MV411-PBS_6h-r1_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr203-MV411-MYBi_6h-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr209-MV411-MS2-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr204-MV411-MYBi_6h-r4_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr215-MV411-MS2_JQ1-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr218-MV411-DMSO-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr206-MV411-PBS_6h-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr215-MV411-MS2_JQ1-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr212-MV411-JQ1-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr207-MV411-PBS_6h-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr219-MV411-DMSO-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr219-MV411-DMSO-r3_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr205-MV411-PBS_6h-r1_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr194-MV411-MYBi_30m-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr194-MV411-MYBi_30m-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr202-MV411-MYBi_6h-r2_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr195-MV411-MYBi_30m-r3_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/snp/mr204-MV411-MYBi_6h-r4_snp.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/snp/mr198-MV411-PBS_30m-r2_snp.vcf [Content-Type=text/vcard]...
Copying file://../../data/slamseqMax/res/filter/mr193-MV411-MYBi_30m-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr209-MV411-MS2-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr215-MV411-MS2_JQ1-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr207-MV411-PBS_6h-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr197-MV411-PBS_30m-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr197-MV411-PBS_30m-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr216-MV411-MS2_JQ1-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr196-MV411-MYBi_30m-r4_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr216-MV411-MS2_JQ1-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr194-MV411-MYBi_30m-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr219-MV411-DMSO-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr218-MV411-DMSO-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr204-MV411-MYBi_6h-r4_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr206-MV411-PBS_6h-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr203-MV411-MYBi_6h-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr214-MV411-MS2_JQ1-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr214-MV411-MS2_JQ1-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr206-MV411-PBS_6h-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr211-MV411-JQ1-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr206-MV411-PBS_6h-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr195-MV411-MYBi_30m-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr219-MV411-DMSO-r3_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr216-MV411-MS2_JQ1-r3_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr202-MV411-MYBi_6h-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr198-MV411-PBS_30m-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr207-MV411-PBS_6h-r3_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr201-MV411-MYBi_6h-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr217-MV411-DMSO-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr208-MV411-MS2-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr208-MV411-MS2-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr205-MV411-PBS_6h-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr217-MV411-DMSO-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr204-MV411-MYBi_6h-r4_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr196-MV411-MYBi_30m-r4_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr194-MV411-MYBi_30m-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr195-MV411-MYBi_30m-r3_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr214-MV411-MS2_JQ1-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr198-MV411-PBS_30m-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr213-MV411-JQ1-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr199-MV411-PBS_30m-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr201-MV411-MYBi_6h-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr211-MV411-JQ1-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr210-MV411-MS2-r3_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr197-MV411-PBS_30m-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr215-MV411-MS2_JQ1-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr202-MV411-MYBi_6h-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr203-MV411-MYBi_6h-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr211-MV411-JQ1-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr201-MV411-MYBi_6h-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr200-MV411-PBS_30m-r4_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr199-MV411-PBS_30m-r3_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr200-MV411-PBS_30m-r4_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr200-MV411-PBS_30m-r4_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr195-MV411-MYBi_30m-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr212-MV411-JQ1-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr207-MV411-PBS_6h-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr208-MV411-MS2-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr204-MV411-MYBi_6h-r4_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr194-MV411-MYBi_30m-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr212-MV411-JQ1-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr210-MV411-MS2-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr215-MV411-MS2_JQ1-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr193-MV411-MYBi_30m-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr198-MV411-PBS_30m-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr209-MV411-MS2-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr205-MV411-PBS_6h-r1_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr203-MV411-MYBi_6h-r3_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr202-MV411-MYBi_6h-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr213-MV411-JQ1-r3_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr218-MV411-DMSO-r2_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr212-MV411-JQ1-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr210-MV411-MS2-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr219-MV411-DMSO-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr196-MV411-MYBi_30m-r4_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr199-MV411-PBS_30m-r3_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr205-MV411-PBS_6h-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr217-MV411-DMSO-r1_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr209-MV411-MS2-r2_filtered.bam [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr218-MV411-DMSO-r2_filtered.log [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr193-MV411-MYBi_30m-r1_filtered.bam.bai [Content-Type=application/octet-stream]...
Copying file://../../data/slamseqMax/res/filter/mr213-MV411-JQ1-r3_filtered.log [Content-Type=application/octet-stream]...
| [415/415 files][305.7 GiB/305.7 GiB] 100% Done 109.3 MiB/s ETA 00:00:00       
Operation completed over 415 objects/305.7 GiB.                                  

Getting counts over ERCC genome

In [496]:
counts = {}
folder = "../../data/slamseqMax/res/filter"
files = ! ls $folder/ERCC*
files = [file.split('/')[-1] for file in files if file.endswith(".bam")]
In [445]:
parrun(["samtools view -hb "+folder+"/"+f+" ERCC-00002 ERCC-00003 ERCC-00004 ERCC-00009 ERCC-00012 ERCC-00013 ERCC-00014 ERCC-00016 ERCC-00017 ERCC-00019 ERCC-00022 ERCC-00024 ERCC-00025 ERCC-00028 ERCC-00031 ERCC-00033 ERCC-00034 ERCC-00035 ERCC-00039 ERCC-00040 ERCC-00041 ERCC-00042 ERCC-00043 ERCC-00044 ERCC-00046 ERCC-00048 ERCC-00051 ERCC-00053 ERCC-00054 ERCC-00057 ERCC-00058 ERCC-00059 ERCC-00060 ERCC-00061 ERCC-00062 ERCC-00067 ERCC-00069 ERCC-00071 ERCC-00073 ERCC-00074 ERCC-00075 ERCC-00076 ERCC-00077 ERCC-00078 ERCC-00079 ERCC-00081 ERCC-00083 ERCC-00084 ERCC-00085 ERCC-00086 ERCC-00092 ERCC-00095 ERCC-00096 ERCC-00097 ERCC-00098 ERCC-00099 ERCC-00104 ERCC-00108 ERCC-00109 ERCC-00111 ERCC-00112 ERCC-00113 ERCC-00116 ERCC-00117 ERCC-00120 ERCC-00123 ERCC-00126 ERCC-00130 ERCC-00131 ERCC-00134 ERCC-00136 ERCC-00137 ERCC-00138 ERCC-00142 ERCC-00143 ERCC-00144 ERCC-00145 ERCC-00147 ERCC-00148 ERCC-00150 ERCC-00154 ERCC-00156 ERCC-00157 ERCC-00158 ERCC-00160 ERCC-00162 ERCC-00163 ERCC-00164 ERCC-00165 ERCC-00168 ERCC-00170 ERCC-00171 > "+folder+"/ERCC_"+f for f in files],cores=10)
---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-445-d538394e2432> in <module>
----> 1 parrun(["samtools view -hb "+folder+"/"+f+" ERCC-00002 ERCC-00003 ERCC-00004 ERCC-00009 ERCC-00012 ERCC-00013 ERCC-00014 ERCC-00016 ERCC-00017 ERCC-00019 ERCC-00022 ERCC-00024 ERCC-00025 ERCC-00028 ERCC-00031 ERCC-00033 ERCC-00034 ERCC-00035 ERCC-00039 ERCC-00040 ERCC-00041 ERCC-00042 ERCC-00043 ERCC-00044 ERCC-00046 ERCC-00048 ERCC-00051 ERCC-00053 ERCC-00054 ERCC-00057 ERCC-00058 ERCC-00059 ERCC-00060 ERCC-00061 ERCC-00062 ERCC-00067 ERCC-00069 ERCC-00071 ERCC-00073 ERCC-00074 ERCC-00075 ERCC-00076 ERCC-00077 ERCC-00078 ERCC-00079 ERCC-00081 ERCC-00083 ERCC-00084 ERCC-00085 ERCC-00086 ERCC-00092 ERCC-00095 ERCC-00096 ERCC-00097 ERCC-00098 ERCC-00099 ERCC-00104 ERCC-00108 ERCC-00109 ERCC-00111 ERCC-00112 ERCC-00113 ERCC-00116 ERCC-00117 ERCC-00120 ERCC-00123 ERCC-00126 ERCC-00130 ERCC-00131 ERCC-00134 ERCC-00136 ERCC-00137 ERCC-00138 ERCC-00142 ERCC-00143 ERCC-00144 ERCC-00145 ERCC-00147 ERCC-00148 ERCC-00150 ERCC-00154 ERCC-00156 ERCC-00157 ERCC-00158 ERCC-00160 ERCC-00162 ERCC-00163 ERCC-00164 ERCC-00165 ERCC-00168 ERCC-00170 ERCC-00171 > "+folder+"/"+f for f in files],cores=10)

~/JKBio/Helper.py in parrun(cmds, cores, add)
    803       res = subprocess.run(exe, capture_output=True, shell=True)
    804       if res.returncode != 0:
--> 805         raise ValueError('issue with the command: ' + str(res.stderr))
    806       exe = ''
    807       if len(add) != 0:

ValueError: issue with the command: b'[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n[main_samview] random alignment retrieval only works for indexed BAM or CRAM files.\n'
In [486]:
parrun(["bedtools genomecov -ibam "+folder+"/ERCC_"+f+" > "+folder+"/"+f+".bed" for f in files],cores=10)
In [498]:
files
Out[498]:
['mr193-MV411-MYBi_30m-r1_filtered.bam.bed',
 'mr194-MV411-MYBi_30m-r2_filtered.bam.bed',
 'mr195-MV411-MYBi_30m-r3_filtered.bam.bed',
 'mr196-MV411-MYBi_30m-r4_filtered.bam.bed',
 'mr197-MV411-PBS_30m-r1_filtered.bam.bed',
 'mr198-MV411-PBS_30m-r2_filtered.bam.bed',
 'mr199-MV411-PBS_30m-r3_filtered.bam.bed',
 'mr200-MV411-PBS_30m-r4_filtered.bam.bed',
 'mr201-MV411-MYBi_6h-r1_filtered.bam.bed',
 'mr202-MV411-MYBi_6h-r2_filtered.bam.bed',
 'mr203-MV411-MYBi_6h-r3_filtered.bam.bed',
 'mr204-MV411-MYBi_6h-r4_filtered.bam.bed',
 'mr205-MV411-PBS_6h-r1_filtered.bam.bed',
 'mr206-MV411-PBS_6h-r2_filtered.bam.bed',
 'mr207-MV411-PBS_6h-r3_filtered.bam.bed',
 'mr208-MV411-MS2-r1_filtered.bam.bed',
 'mr209-MV411-MS2-r2_filtered.bam.bed',
 'mr210-MV411-MS2-r3_filtered.bam.bed',
 'mr211-MV411-JQ1-r1_filtered.bam.bed',
 'mr212-MV411-JQ1-r2_filtered.bam.bed',
 'mr213-MV411-JQ1-r3_filtered.bam.bed',
 'mr214-MV411-MS2_JQ1-r1_filtered.bam.bed',
 'mr215-MV411-MS2_JQ1-r2_filtered.bam.bed',
 'mr216-MV411-MS2_JQ1-r3_filtered.bam.bed',
 'mr217-MV411-DMSO-r1_filtered.bam.bed',
 'mr218-MV411-DMSO-r2_filtered.bam.bed',
 'mr219-MV411-DMSO-r3_filtered.bam.bed',
 'mr252-MV411_MEF2D-DMSO_2h-r1_filtered.bam.bed',
 'mr253-MV411_MEF2D-DMSO_2h-r2_filtered.bam.bed',
 'mr254-MV411_MEF2D-DMSO_2h-r3_filtered.bam.bed',
 'mr255-MV411_MEF2D-DMSO_2h-r4_filtered.bam.bed',
 'mr256-MV411_MEF2D-VHL_2h-r1_filtered.bam.bed',
 'mr257-MV411_MEF2D-VHL_2h-r2_filtered.bam.bed',
 'mr258-MV411_MEF2D-VHL_2h-r3_filtered.bam.bed',
 'mr259-MV411_MEF2D-VHL_2h-r4_filtered.bam.bed',
 'mr260-MV411_MEF2D-DMSO_24h-r1_filtered.bam.bed',
 'mr261-MV411_MEF2D-DMSO_24h-r2_filtered.bam.bed',
 'mr262-MV411_MEF2D-DMSO_24h-r3_filtered.bam.bed',
 'mr263-MV411_MEF2D-DMSO_24h-r4_filtered.bam.bed',
 'mr264-MV411_MEF2D-VHL_24h-r1_filtered.bam.bed',
 'mr265-MV411_MEF2D-VHL_24h-r2_filtered.bam.bed',
 'mr266-MV411_MEF2D-VHL_24h-r3_filtered.bam.bed',
 'mr267-MV411_MEF2D-VHL_24h-r4_filtered.bam.bed',
 'mr268-MV411-PBS_24h-r1_filtered.bam.bed',
 'mr269-MV411-PBS_24h-r2_filtered.bam.bed',
 'mr270-MV411-PBS_24h-r3_filtered.bam.bed',
 'mr271-MV411-PBS_24h-r4_filtered.bam.bed',
 'mr272-MV411-MYBi_24h-r1_filtered.bam.bed',
 'mr273-MV411-MYBi_24h-r2_filtered.bam.bed',
 'mr274-MV411-MYBi_24h-r3_filtered.bam.bed']
In [499]:
ERCC = ["ERCC-00002", "ERCC-00003", "ERCC-00004", "ERCC-00009", "ERCC-00012", "ERCC-00013", "ERCC-00014", "ERCC-00016", "ERCC-00017", "ERCC-00019", "ERCC-00022", "ERCC-00024", "ERCC-00025", "ERCC-00028", "ERCC-00031", "ERCC-00033", "ERCC-00034", "ERCC-00035", "ERCC-00039", "ERCC-00040", "ERCC-00041", "ERCC-00042", "ERCC-00043", "ERCC-00044", "ERCC-00046", "ERCC-00048", "ERCC-00051", "ERCC-00053", "ERCC-00054", "ERCC-00057", "ERCC-00058", "ERCC-00059", "ERCC-00060", "ERCC-00061", "ERCC-00062", "ERCC-00067", "ERCC-00069", "ERCC-00071", "ERCC-00073", "ERCC-00074", "ERCC-00075", "ERCC-00076", "ERCC-00077", "ERCC-00078", "ERCC-00079", "ERCC-00081", "ERCC-00083", "ERCC-00084", "ERCC-00085", "ERCC-00086", "ERCC-00092", "ERCC-00095", "ERCC-00096", "ERCC-00097", "ERCC-00098", "ERCC-00099", "ERCC-00104", "ERCC-00108", "ERCC-00109", "ERCC-00111", "ERCC-00112", "ERCC-00113", "ERCC-00116", "ERCC-00117", "ERCC-00120", "ERCC-00123", "ERCC-00126", "ERCC-00130", "ERCC-00131", "ERCC-00134", "ERCC-00136", "ERCC-00137", "ERCC-00138", "ERCC-00142", "ERCC-00143", "ERCC-00144", "ERCC-00145", "ERCC-00147", "ERCC-00148", "ERCC-00150", "ERCC-00154", "ERCC-00156", "ERCC-00157", "ERCC-00158", "ERCC-00160", "ERCC-00162", "ERCC-00163", "ERCC-00164", "ERCC-00165", "ERCC-00168", "ERCC-00170", "ERCC-00171"]
res  = {i:[] for i in files}
for val in files:
    cov = pd.read_csv(folder+"/"+val,sep="\t",header=None)
    for i in ERCC:
        res[val].append(cov[cov[0]==i][1].mean())
df = pd.DataFrame(data=res,index=ERCC)
In [80]:
totalcounts = ! for unkn in $(ls ../../data/slamseqMax/res/filter/mr*.bam); do samtools view -c -F 260 $unkn; done
In [500]:
totalcounts= [
52834953,
48661773,
99303819,
45979870,
71673717,
90428614,
51950460,
75989518,
41520582,
44914503,
34919910,
34840133,
44955360,
50106552,
47137700,
148549270,
103180767,
160756237,
128740743,
109673222,
130928802,
147257131,
149990181,
155634820,
116426167,
124950994,
86078120,
87120807,
83131772,
169547340,
162737874,
60636179,
101791667,
149282005,
130879596,
204252217,
74266908,
124166412,
109829880,
79024803,
126029299,
93542923,
107586723,
85905103,
31694204,
128780021,
37635249,
36638284,
75047033,
83424257]
In [502]:
res = 10000*df.mean()/totalcounts
In [503]:
res
Out[503]:
mr193-MV411-MYBi_30m-r1_filtered.bam.bed          0.391405
mr194-MV411-MYBi_30m-r2_filtered.bam.bed          0.744062
mr195-MV411-MYBi_30m-r3_filtered.bam.bed          0.693672
mr196-MV411-MYBi_30m-r4_filtered.bam.bed          0.388357
mr197-MV411-PBS_30m-r1_filtered.bam.bed           0.240919
mr198-MV411-PBS_30m-r2_filtered.bam.bed           0.286953
mr199-MV411-PBS_30m-r3_filtered.bam.bed           0.234265
mr200-MV411-PBS_30m-r4_filtered.bam.bed           0.278041
mr201-MV411-MYBi_6h-r1_filtered.bam.bed           0.573790
mr202-MV411-MYBi_6h-r2_filtered.bam.bed           0.472173
mr203-MV411-MYBi_6h-r3_filtered.bam.bed           0.496356
mr204-MV411-MYBi_6h-r4_filtered.bam.bed           0.459814
mr205-MV411-PBS_6h-r1_filtered.bam.bed            0.168788
mr206-MV411-PBS_6h-r2_filtered.bam.bed            0.230918
mr207-MV411-PBS_6h-r3_filtered.bam.bed            0.317403
mr208-MV411-MS2-r1_filtered.bam.bed               0.219222
mr209-MV411-MS2-r2_filtered.bam.bed               0.088623
mr210-MV411-MS2-r3_filtered.bam.bed               0.127521
mr211-MV411-JQ1-r1_filtered.bam.bed               0.073249
mr212-MV411-JQ1-r2_filtered.bam.bed               0.110339
mr213-MV411-JQ1-r3_filtered.bam.bed               0.134256
mr214-MV411-MS2_JQ1-r1_filtered.bam.bed           0.147830
mr215-MV411-MS2_JQ1-r2_filtered.bam.bed           0.267151
mr216-MV411-MS2_JQ1-r3_filtered.bam.bed           0.191032
mr217-MV411-DMSO-r1_filtered.bam.bed              0.161530
mr218-MV411-DMSO-r2_filtered.bam.bed              0.135641
mr219-MV411-DMSO-r3_filtered.bam.bed              0.141818
mr252-MV411_MEF2D-DMSO_2h-r1_filtered.bam.bed     0.220618
mr253-MV411_MEF2D-DMSO_2h-r2_filtered.bam.bed     0.234046
mr254-MV411_MEF2D-DMSO_2h-r3_filtered.bam.bed     0.251439
mr255-MV411_MEF2D-DMSO_2h-r4_filtered.bam.bed     0.191159
mr256-MV411_MEF2D-VHL_2h-r1_filtered.bam.bed      0.225943
mr257-MV411_MEF2D-VHL_2h-r2_filtered.bam.bed      0.226751
mr258-MV411_MEF2D-VHL_2h-r3_filtered.bam.bed      0.256114
mr259-MV411_MEF2D-VHL_2h-r4_filtered.bam.bed      0.231022
mr260-MV411_MEF2D-DMSO_24h-r1_filtered.bam.bed    0.149643
mr261-MV411_MEF2D-DMSO_24h-r2_filtered.bam.bed    0.131132
mr262-MV411_MEF2D-DMSO_24h-r3_filtered.bam.bed    0.143506
mr263-MV411_MEF2D-DMSO_24h-r4_filtered.bam.bed    0.137635
mr264-MV411_MEF2D-VHL_24h-r1_filtered.bam.bed     0.158762
mr265-MV411_MEF2D-VHL_24h-r2_filtered.bam.bed     0.176088
mr266-MV411_MEF2D-VHL_24h-r3_filtered.bam.bed     0.263525
mr267-MV411_MEF2D-VHL_24h-r4_filtered.bam.bed     0.185894
mr268-MV411-PBS_24h-r1_filtered.bam.bed           0.270967
mr269-MV411-PBS_24h-r2_filtered.bam.bed           0.322324
mr270-MV411-PBS_24h-r3_filtered.bam.bed           0.183615
mr271-MV411-PBS_24h-r4_filtered.bam.bed           0.164630
mr272-MV411-MYBi_24h-r1_filtered.bam.bed          1.131675
mr273-MV411-MYBi_24h-r2_filtered.bam.bed          0.819142
mr274-MV411-MYBi_24h-r3_filtered.bam.bed          1.061710
dtype: float64
In [301]:
r = {'MYBi_30m': [0.5543739168045854, 0.1654583646526328], #r at v1
 'PBS_30m': [0.2600444176284328, 0.02279444794903803],
 'MYBi_6h': [0.5005330862395866, 0.04428975746477769],
 'PBS_6h': [0.23903615815004206, 0.060942601783761284],
 'MS2': [0.14512165615335024, 0.054750165018263075],
 'JQ1': [0.10594775516310602, 0.025098518494594674],
 'MS2_JQ1': [0.20200435554076682, 0.0493267432253527],
 'DMSO': [0.14632946312395476, 0.011039982545173618]}
In [504]:
prev=0
r={}
for val in [4,4,4,3,3,3,3,3,4,4,4,4,4,3]:
    r[res.keys()[prev].split('-')[2]]=[np.mean(res[prev:prev+val]), np.var(res[prev:prev+val])**(1/2)]
    prev+=val
In [ ]:
r = {'MYBi_30m': [0.5543739168045854, 0.1654583646526328], #r at v1
 'PBS_30m': [0.2600444176284328, 0.02279444794903803],
 'MYBi_6h': [0.5005330862395866, 0.04428975746477769],
 'PBS_6h': [0.23903615815004206, 0.060942601783761284],
 'MS2': [0.14512165615335024, 0.054750165018263075],
 'JQ1': [0.10594775516310602, 0.025098518494594674],
 'MS2_JQ1': [0.20200435554076682, 0.0493267432253527],
 'DMSO': [0.14632946312395476, 0.011039982545173618]}
In [91]:
r = {'DMSO_2h': [0.2243153232470735, 0.02204177171648129],
 'VHL_2h': [0.23495725535742493, 0.012366178880134462],
 'DMSO_24h': [0.14047889898493598, 0.0068663572605201255],
 'VHL_24h': [0.1960673739532328, 0.04013998428238451],
 'PBS_24h': [0.23538398133738964, 0.06424715552832781],
 'MYBi_24h': [1.0041758119681277, 0.13391993501133953]}
Out[91]:
{'DMSO_2h': [0.2243153232470735, 0.02204177171648129],
 'VHL_2h': [0.23495725535742493, 0.012366178880134462],
 'DMSO_24h': [0.14047889898493598, 0.0068663572605201255],
 'VHL_24h': [0.1960673739532328, 0.04013998428238451],
 'PBS_24h': [0.23538398133738964, 0.06424715552832781],
 'MYBi_24h': [1.0041758119681277, 0.13391993501133953]}
In [506]:
d= pd.DataFrame(data=r.values(),index=r.keys(), columns=['ERCC pseudo-counts','var'])
d['Experiments']=d.index
sns.barplot("Experiments","ERCC pseudo-counts",data=d,ci=None,)
plt.errorbar(x=range(0,len(d)),y=d['ERCC pseudo-counts'],
            yerr=d['var'], fmt='none', c= 'r')
plt.xticks(rotation=60,ha='right')
plt.savefig('../results/'+project+"/plots/"+version+"_scaling_fact_with_conf.pdf")
In [508]:
location= '../../data/'+project+'/res/count/'
mincount_toremove=5
minvar_toremove=0
In [509]:
readcounts, tccounts = readFromSlamdunk(loc=location,minvar_toremove=minvar_toremove, mincount_toremove=mincount_toremove)
found 50 files:dict_keys(['mr270-MV411-PBS_24h-r3_tcount', 'mr268-MV411-PBS_24h-r1_tcount', 'mr211-MV411-JQ1-r1_tcount', 'mr272-MV411-MYBi_24h-r1_tcount', 'mr203-MV411-MYBi_6h-r3_tcount', 'mr194-MV411-MYBi_30m-r2_tcount', 'mr197-MV411-PBS_30m-r1_tcount', 'mr210-MV411-MS2-r3_tcount', 'mr196-MV411-MYBi_30m-r4_tcount', 'mr269-MV411-PBS_24h-r2_tcount', 'mr263-MV411_MEF2D-DMSO_24h-r4_tcount', 'mr206-MV411-PBS_6h-r2_tcount', 'mr207-MV411-PBS_6h-r3_tcount', 'mr257-MV411_MEF2D-VHL_2h-r2_tcount', 'mr266-MV411_MEF2D-VHL_24h-r3_tcount', 'mr258-MV411_MEF2D-VHL_2h-r3_tcount', 'mr200-MV411-PBS_30m-r4_tcount', 'mr198-MV411-PBS_30m-r2_tcount', 'mr255-MV411_MEF2D-DMSO_2h-r4_tcount', 'mr195-MV411-MYBi_30m-r3_tcount', 'mr219-MV411-DMSO-r3_tcount', 'mr259-MV411_MEF2D-VHL_2h-r4_tcount', 'mr218-MV411-DMSO-r2_tcount', 'mr253-MV411_MEF2D-DMSO_2h-r2_tcount', 'mr261-MV411_MEF2D-DMSO_24h-r2_tcount', 'mr202-MV411-MYBi_6h-r2_tcount', 'mr209-MV411-MS2-r2_tcount', 'mr256-MV411_MEF2D-VHL_2h-r1_tcount', 'mr212-MV411-JQ1-r2_tcount', 'mr254-MV411_MEF2D-DMSO_2h-r3_tcount', 'mr264-MV411_MEF2D-VHL_24h-r1_tcount', 'mr262-MV411_MEF2D-DMSO_24h-r3_tcount', 'mr267-MV411_MEF2D-VHL_24h-r4_tcount', 'mr265-MV411_MEF2D-VHL_24h-r2_tcount', 'mr201-MV411-MYBi_6h-r1_tcount', 'mr273-MV411-MYBi_24h-r2_tcount', 'mr217-MV411-DMSO-r1_tcount', 'mr213-MV411-JQ1-r3_tcount', 'mr215-MV411-MS2_JQ1-r2_tcount', 'mr208-MV411-MS2-r1_tcount', 'mr214-MV411-MS2_JQ1-r1_tcount', 'mr271-MV411-PBS_24h-r4_tcount', 'mr216-MV411-MS2_JQ1-r3_tcount', 'mr193-MV411-MYBi_30m-r1_tcount', 'mr274-MV411-MYBi_24h-r3_tcount', 'mr260-MV411_MEF2D-DMSO_24h-r1_tcount', 'mr205-MV411-PBS_6h-r1_tcount', 'mr252-MV411_MEF2D-DMSO_2h-r1_tcount', 'mr199-MV411-PBS_30m-r3_tcount', 'mr204-MV411-MYBi_6h-r4_tcount'])
2023 538
[772, 243] [12, 5]
787 93
[709, 174] [2, 0]
1487 663
[2227, 635] [46, 7]
97 3
[533, 126] [4, 0]
206 26
[257, 45] [1, 1]
385 106
[785, 182] [0, 3]
1435 447
[1069, 291] [9, 3]
2044 951
[1823, 465] [40, 9]
308 76
[780, 189] [5, 1]
250 33
[295, 50] [0, 0]
2341 440
[621, 194] [1, 1]
558 226
[747, 158] [17, 6]
475 135
[617, 175] [13, 0]
556 148
[815, 209] [2, 0]
305 36
[468, 129] [0, 0]
1595 423
[1054, 244] [7, 0]
1667 617
[1179, 320] [22, 1]
1537 426
[1549, 380] [14, 4]
4857 2222
[958, 277] [7, 6]
836 203
[1412, 374] [7, 1]
792 318
[590, 185] [16, 2]
3671 1891
[712, 221] [17, 5]
1124 439
[1432, 378] [28, 4]
1688 530
[566, 148] [5, 1]
773 49
[551, 108] [1, 0]
253 20
[285, 79] [0, 1]
1202 408
[905, 248] [20, 11]
1321 543
[441, 120] [4, 0]
1069 364
[2102, 564] [27, 5]
5287 2163
[999, 303] [10, 3]
768 187
[285, 74] [5, 1]
2185 420
[661, 198] [6, 1]
503 61
[532, 132] [1, 0]
1656 532
[379, 114] [2, 2]
331 28
[308, 61] [1, 0]
809 22
[708, 149] [4, 0]
1130 553
[1157, 290] [38, 6]
1241 497
[2297, 594] [45, 8]
1567 496
[1057, 267] [7, 1]
1959 759
[1658, 421] [23, 2]
1412 474
[1177, 311] [11, 0]
153 19
[456, 110] [4, 0]
1938 688
[1139, 260] [12, 4]
415 90
[741, 188] [3, 1]
744 17
[1038, 139] [0, 0]
4751 861
[1176, 373] [9, 3]
515 187
[607, 133] [9, 1]
2177 721
[534, 160] [5, 0]
1112 403
[978, 227] [11, 3]
184 21
[256, 59] [1, 0]
you need access to taiga for this (https://pypi.org/project/taigapy/)
1118 could not be parsed... we don't have all genes already
you need access to taiga for this (https://pypi.org/project/taigapy/)
1118 could not be parsed... we don't have all genes already
In [317]:
#feel like subsetting?
readcounts = readcounts[readcounts.columns[:27]]
tccounts = tccounts[tccounts.columns[:27]]

SLAM-seq

All SLAM-seq assays were performed at 60-70% confluency for adherent cells or 60% of the maximum cell density counted on a hemocytometer for suspension cells. 5-7h prior to each assay, growth medium was aspirated and replaced. Unless stated otherwise, cells were pre-treated with indicated small molecule inhibitors or 100µM IAA for 30 min to pre-establish full target inhibition or degradation. Newly synthesized RNA was labeled for indicated time spans (45 min or 60 min) at a final concentration of 100µM 4- thiouridine (4sU, Carbosynth). Adherent cells were harvested by direct snap-freezing of plates on dry ice. Suspension cells were spun down and immediately snap-frozen. RNA extraction was performed using the RNeasy Plus Mini Kit (Qiagen).

Total RNA was subjected to alkylation by iodoacetamide (Sigma, 10mM) for 15 min and RNA was repurified by ethanol precipitation. 500ng alkylated RNA were used as input for generating 3’-end mRNA sequencing libraries using a commercially available kit (QuantSeq 3′ mRNA-Seq Library Prep Kit FWD for Illumina and PCR Add-on Kit for Illumina, Lexogen). Deep sequencing was performed using HiSeq1500 and HiSeq2500 platforms (Illumina).

0.06724463 0.04916348 0.03728357 0.05075007 0.03331248 0.0346662 0.03265504 0.04416262 0.05574821 0.05845953 0.05531433 0.06175393 0.03181749 0.02940226 0.0306263 0.04004278

In [66]:
mkdir ../results/$project
In [511]:
col = tccounts.columns.tolist()
col.sort()
tccounts = tccounts[col]
In [512]:
col = readcounts.columns.tolist()
col.sort()
readcounts = readcounts[col]
In [513]:
readcounts
Out[513]:
mr193-MV411-MYBi_30m-r1_tcount mr194-MV411-MYBi_30m-r2_tcount mr195-MV411-MYBi_30m-r3_tcount mr196-MV411-MYBi_30m-r4_tcount mr197-MV411-PBS_30m-r1_tcount mr198-MV411-PBS_30m-r2_tcount mr199-MV411-PBS_30m-r3_tcount mr200-MV411-PBS_30m-r4_tcount mr201-MV411-MYBi_6h-r1_tcount mr202-MV411-MYBi_6h-r2_tcount ... mr265-MV411_MEF2D-VHL_24h-r2_tcount mr266-MV411_MEF2D-VHL_24h-r3_tcount mr267-MV411_MEF2D-VHL_24h-r4_tcount mr268-MV411-PBS_24h-r1_tcount mr269-MV411-PBS_24h-r2_tcount mr270-MV411-PBS_24h-r3_tcount mr271-MV411-PBS_24h-r4_tcount mr272-MV411-MYBi_24h-r1_tcount mr273-MV411-MYBi_24h-r2_tcount mr274-MV411-MYBi_24h-r3_tcount
A1BG 2 0 0 0 0 1 0 2 0 0 ... 1 0 0 1 0 3 3 2 6 1
A2M 4 2 3 1 0 3 3 3 1 0 ... 0 0 0 0 0 1 0 0 1 0
NAT1 33 41 65 29 77 68 38 74 37 32 ... 222 71 34 90 43 175 25 9 63 38
AAMP 540 512 829 523 603 842 584 741 400 553 ... 1746 1507 1787 1238 428 1577 582 619 764 1199
AARS1 1230 1038 2124 1022 1616 2363 1263 1719 276 352 ... 1703 1464 1649 1398 754 1752 752 380 603 862
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
107080638 281 221 502 264 408 517 274 359 138 132 ... 478 446 495 539 170 596 250 226 349 454
107080644 0 0 2 0 1 1 1 1 0 0 ... 3 0 3 4 0 0 0 0 3 0
BOLA2-SMG1P6 4 8 6 6 9 6 3 7 6 4 ... 22 29 39 9 3 23 7 5 4 7
107303344 126 96 230 81 165 200 145 161 33 25 ... 137 52 114 158 44 196 58 43 155 182
SCARNA18B 1 2 6 1 2 1 1 1 5 2 ... 2 1 0 0 0 0 0 0 9 6

16733 rows × 50 columns

In [517]:
 
Out[517]:
mr193-MV411-MYBi_30m-r1_tcount mr194-MV411-MYBi_30m-r2_tcount mr195-MV411-MYBi_30m-r3_tcount mr196-MV411-MYBi_30m-r4_tcount mr197-MV411-PBS_30m-r1_tcount mr198-MV411-PBS_30m-r2_tcount mr199-MV411-PBS_30m-r3_tcount mr200-MV411-PBS_30m-r4_tcount mr201-MV411-MYBi_6h-r1_tcount mr202-MV411-MYBi_6h-r2_tcount ... mr265-MV411_MEF2D-VHL_24h-r2_tcount mr266-MV411_MEF2D-VHL_24h-r3_tcount mr267-MV411_MEF2D-VHL_24h-r4_tcount mr268-MV411-PBS_24h-r1_tcount mr269-MV411-PBS_24h-r2_tcount mr270-MV411-PBS_24h-r3_tcount mr271-MV411-PBS_24h-r4_tcount mr272-MV411-MYBi_24h-r1_tcount mr273-MV411-MYBi_24h-r2_tcount mr274-MV411-MYBi_24h-r3_tcount
A1BG 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 0 0 0 0
A2M 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 0 0 0 0
NAT1 1 2 1 2 5 0 3 4 3 1 ... 3 0 0 1 0 9 0 0 0 0
AAMP 10 8 8 11 8 7 8 11 0 2 ... 15 0 1 7 0 21 0 0 0 0
AARS1 11 4 9 4 9 18 14 16 2 3 ... 10 0 2 2 0 19 1 0 0 2
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
107080638 2 0 2 3 0 1 1 2 0 0 ... 4 0 0 0 0 1 0 0 0 0
107080644 0 0 0 0 0 0 0 0 0 0 ... 1 0 0 0 0 0 0 0 0 0
BOLA2-SMG1P6 0 0 0 1 0 0 0 1 0 0 ... 4 0 0 0 0 0 0 0 0 0
107303344 2 1 0 1 0 0 0 4 1 0 ... 0 0 0 0 0 1 0 0 1 0
SCARNA18B 0 0 1 0 0 0 1 0 0 0 ... 0 0 0 0 0 0 0 0 4 0

16256 rows × 50 columns

In [519]:
readcounts
Out[519]:
mr193-MV411-MYBi_30m-r1_tcount mr194-MV411-MYBi_30m-r2_tcount mr195-MV411-MYBi_30m-r3_tcount mr196-MV411-MYBi_30m-r4_tcount mr197-MV411-PBS_30m-r1_tcount mr198-MV411-PBS_30m-r2_tcount mr199-MV411-PBS_30m-r3_tcount mr200-MV411-PBS_30m-r4_tcount mr201-MV411-MYBi_6h-r1_tcount mr202-MV411-MYBi_6h-r2_tcount ... mr265-MV411_MEF2D-VHL_24h-r2_tcount mr266-MV411_MEF2D-VHL_24h-r3_tcount mr267-MV411_MEF2D-VHL_24h-r4_tcount mr268-MV411-PBS_24h-r1_tcount mr269-MV411-PBS_24h-r2_tcount mr270-MV411-PBS_24h-r3_tcount mr271-MV411-PBS_24h-r4_tcount mr272-MV411-MYBi_24h-r1_tcount mr273-MV411-MYBi_24h-r2_tcount mr274-MV411-MYBi_24h-r3_tcount
A1BG 2 0 0 0 0 1 0 2 0 0 ... 1 0 0 1 0 3 3 2 6 1
A2M 4 2 3 1 0 3 3 3 1 0 ... 0 0 0 0 0 1 0 0 1 0
NAT1 33 41 65 29 77 68 38 74 37 32 ... 222 71 34 90 43 175 25 9 63 38
AAMP 540 512 829 523 603 842 584 741 400 553 ... 1746 1507 1787 1238 428 1577 582 619 764 1199
AARS1 1230 1038 2124 1022 1616 2363 1263 1719 276 352 ... 1703 1464 1649 1398 754 1752 752 380 603 862
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
107080638 281 221 502 264 408 517 274 359 138 132 ... 478 446 495 539 170 596 250 226 349 454
107080644 0 0 2 0 1 1 1 1 0 0 ... 3 0 3 4 0 0 0 0 3 0
BOLA2-SMG1P6 4 8 6 6 9 6 3 7 6 4 ... 22 29 39 9 3 23 7 5 4 7
107303344 126 96 230 81 165 200 145 161 33 25 ... 137 52 114 158 44 196 58 43 155 182
SCARNA18B 1 2 6 1 2 1 1 1 5 2 ... 2 1 0 0 0 0 0 0 9 6

16733 rows × 50 columns

In [543]:
#what is the average of highly transcribed genes 
a = tccounts[readcounts.sum(1)>30] / readcounts[readcounts.sum(1)>30]
a = a.fillna(0)
a = a.max(1).tolist()
a.sort()
sns.kdeplot(a)
Out[543]:
<matplotlib.axes._subplots.AxesSubplot at 0x7f74c580e400>
In [544]:
np.median(a)
Out[544]:
0.07321881740895825
In [546]:
readcounts.to_csv('../results/'+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_readcounts.csv',index=False)
tccounts.to_csv('../results/'+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_tccounts.csv',index=False)
In [410]:
readcounts = pd.read_csv('../results/'+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_readcounts.csv')
tccounts = pd.read_csv('../results/'+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_tccounts.csv')

make more dataframes

In [547]:
mtccounts = pd.DataFrame()
mreadcounts = pd.DataFrame()
for i in set([i.split('-')[2] for i in tccounts.columns]):
    mtccounts[i] = tccounts[[v for v in tccounts.columns if i in v]].mean(1)
    mreadcounts[i] = readcounts[[v for v in readcounts.columns if i in v]].mean(1)
In [548]:
mtccounts.to_csv("../results/"+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+"_mean_tccounts.csv")
mreadcounts.to_csv("../results/"+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+"_mean_readcounts.csv")
In [549]:
mtccounts = pd.DataFrame()
mreadcounts = pd.DataFrame()
for i in set([i.split('-')[2] for i in tccounts.columns]):
    mtccounts[i] = tccounts[[v for v in tccounts.columns if i in v]].median(1)
    mreadcounts[i] = readcounts[[v for v in readcounts.columns if i in v]].median(1)
In [550]:
mtccounts.to_csv("../results/"+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+"_median_tccounts.csv")
mreadcounts.to_csv("../results/"+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+"_median_readcounts.csv")
In [551]:
(tccounts/readcounts).fillna(0).to_csv("../results/"+project+'/'+version+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+"_tccounts_per_readcounts.csv")

lets look at the similarity accross replicates

we have some outliers, else it seems to make some sense and on average, to be extremelly similar!

In [552]:
tccounts.columns = [i.replace('-','.') for i in tccounts.columns]
readcounts.columns = [i.replace('-','.') for i in readcounts.columns]
In [86]:
mkdir ../results/$project/plots/
In [105]:
tccounts
Out[105]:
mr252.MV411_MEF2D.DMSO_2h.r1_tcount mr253.MV411_MEF2D.DMSO_2h.r2_tcount mr254.MV411_MEF2D.DMSO_2h.r3_tcount mr255.MV411_MEF2D.DMSO_2h.r4_tcount mr256.MV411_MEF2D.VHL_2h.r1_tcount mr257.MV411_MEF2D.VHL_2h.r2_tcount mr258.MV411_MEF2D.VHL_2h.r3_tcount mr259.MV411_MEF2D.VHL_2h.r4_tcount mr260.MV411_MEF2D.DMSO_24h.r1_tcount mr261.MV411_MEF2D.DMSO_24h.r2_tcount ... mr265.MV411_MEF2D.VHL_24h.r2_tcount mr266.MV411_MEF2D.VHL_24h.r3_tcount mr267.MV411_MEF2D.VHL_24h.r4_tcount mr268.MV411.PBS_24h.r1_tcount mr269.MV411.PBS_24h.r2_tcount mr270.MV411.PBS_24h.r3_tcount mr271.MV411.PBS_24h.r4_tcount mr272.MV411.MYBi_24h.r1_tcount mr273.MV411.MYBi_24h.r2_tcount mr274.MV411.MYBi_24h.r3_tcount
A1BG 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 0 0 0 0
NAT1 4 3 18 25 3 0 3 21 5 0 ... 3 0 0 1 0 9 0 0 0 0
AAMP 7 5 17 10 5 1 11 19 18 0 ... 15 0 1 7 0 21 0 0 0 0
AARS1 13 11 18 25 12 4 9 57 35 2 ... 10 0 2 2 0 19 1 0 0 2
ABAT 1 1 2 3 0 0 0 5 6 0 ... 5 0 0 1 0 5 0 0 0 0
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
107080638 0 2 1 9 1 0 3 3 5 0 ... 4 0 0 0 0 1 0 0 0 0
107080644 0 0 0 0 0 0 0 1 0 0 ... 1 0 0 0 0 0 0 0 0 0
BOLA2-SMG1P6 0 0 0 1 0 0 0 2 0 0 ... 4 0 0 0 0 0 0 0 0 0
107303344 1 0 2 1 1 0 0 1 0 0 ... 0 0 0 0 0 1 0 0 1 0
SCARNA18B 0 0 2 1 0 0 0 3 3 0 ... 0 0 0 0 0 0 0 0 4 0

16289 rows × 23 columns

In [106]:
(tccounts.loc["MYC"]/tccounts.mean(0)) /(readcounts.loc["MYC"]/readcounts.mean(0))
Out[106]:
mr252.MV411_MEF2D.DMSO_2h.r1_tcount     20.906873
mr253.MV411_MEF2D.DMSO_2h.r2_tcount     19.818364
mr254.MV411_MEF2D.DMSO_2h.r3_tcount     15.779573
mr255.MV411_MEF2D.DMSO_2h.r4_tcount     15.709042
mr256.MV411_MEF2D.VHL_2h.r1_tcount      16.630023
mr257.MV411_MEF2D.VHL_2h.r2_tcount      37.013294
mr258.MV411_MEF2D.VHL_2h.r3_tcount      22.111163
mr259.MV411_MEF2D.VHL_2h.r4_tcount      12.809547
mr260.MV411_MEF2D.DMSO_24h.r1_tcount    14.052167
mr261.MV411_MEF2D.DMSO_24h.r2_tcount    21.296080
mr262.MV411_MEF2D.DMSO_24h.r3_tcount    14.070035
mr263.MV411_MEF2D.DMSO_24h.r4_tcount    14.261005
mr264.MV411_MEF2D.VHL_24h.r1_tcount     19.960913
mr265.MV411_MEF2D.VHL_24h.r2_tcount     18.007882
mr266.MV411_MEF2D.VHL_24h.r3_tcount     37.545131
mr267.MV411_MEF2D.VHL_24h.r4_tcount     38.671184
mr268.MV411.PBS_24h.r1_tcount           15.098137
mr269.MV411.PBS_24h.r2_tcount           31.536246
mr270.MV411.PBS_24h.r3_tcount           11.012571
mr271.MV411.PBS_24h.r4_tcount           22.792705
mr272.MV411.MYBi_24h.r1_tcount          19.931377
mr273.MV411.MYBi_24h.r2_tcount           4.800348
mr274.MV411.MYBi_24h.r3_tcount           8.694439
dtype: float64
In [107]:
%matplotlib inline
sns.heatmap(tccounts.corr(), 
            xticklabels=tccounts.columns,
            yticklabels=tccounts.columns)
plt.savefig('../results/'+project+'/plots/'+version+'_similarity_replicates_sorted_readcounts.pdf')
In [108]:
%matplotlib inline
sns.heatmap(readcounts.corr(), 
            xticklabels=readcounts.columns,
            yticklabels=readcounts.columns)
plt.savefig('../results/'+project+'/plots/'+version+'_similarity_replicates.pdf')
In [110]:
%matplotlib inline
sns.heatmap(readcounts[readcounts.columns[:16]].corr(), 
            xticklabels=readcounts.columns[:16],
            yticklabels=readcounts.columns[:16])
plt.savefig('../results/'+project+'/plots/'+version+'_similarity_replicates_MYBi.pdf')

The change with DMSO (PBS) 30m vs 6h is as striking to as the change with MYBi highlighting the impact of batches

A quick detour to look for clustering

Getting the Core TF information

In [326]:
ctf=pd.read_csv('../data/CTF.csv',header=None)[0].values.tolist()
ctf
Out[326]:
['ARID2',
 'CEBPA',
 'CEBPE',
 'E2F3',
 'FLI1',
 'FOSL2',
 'GFI1',
 'GFI1B',
 'HHEX',
 'IRF8',
 'LYL1',
 'MEF2C',
 'MEF2D',
 'MEIS1',
 'MTF1',
 'MYB',
 'MYC',
 'PLAGL2',
 'RUNX1',
 'RUNX2',
 'RXRA',
 'SETDB1',
 'SNAPC5',
 'SP1',
 'SPI1',
 'SREBF1',
 'STAT5B',
 'TERF2',
 'TFAP4',
 'ZEB2',
 'ZFPM1',
 'ZMYND8',
 'LMO2',
 'MAX',
 'ELF2',
 'ETV6',
 'HOXA9',
 'GATA2']
In [327]:
set(ctf) & set(tccounts.index)
Out[327]:
{'ARID2',
 'CEBPA',
 'CEBPE',
 'E2F3',
 'ELF2',
 'ETV6',
 'FLI1',
 'FOSL2',
 'GATA2',
 'GFI1',
 'GFI1B',
 'HHEX',
 'HOXA9',
 'IRF8',
 'LMO2',
 'LYL1',
 'MAX',
 'MEF2C',
 'MEF2D',
 'MEIS1',
 'MTF1',
 'MYB',
 'MYC',
 'PLAGL2',
 'RUNX1',
 'RUNX2',
 'RXRA',
 'SETDB1',
 'SNAPC5',
 'SP1',
 'SPI1',
 'SREBF1',
 'STAT5B',
 'TERF2',
 'TFAP4',
 'ZEB2',
 'ZFPM1',
 'ZMYND8'}
In [328]:
ctfpos = [val for val in tccounts.index if val in ctf]
notctfpos = [val for val in tccounts.index if val not in ctf]
In [114]:
ctfpos.extend(['EGR1','SERTAD1'])

We find a CTF not in the dataset

Let's look at how they change accross time

how core transcription factors change accross time when the cell is with JQ1 conditions

we are looking at the difference between production of each CTF compared to the average RNA production with JQ1 and without JQ1

DESEQ ANALYSIS

In [553]:
readcounts["genes"] = readcounts.index
readcounts = readcounts.reset_index(drop=True)
tccounts["genes"] = tccounts.index
tccounts = tccounts.reset_index(drop=True)
<ipython-input-553-b760b2e1d27d>:1: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  readcounts["genes"] = readcounts.index
In [566]:
tccountsMEF2D= tccounts[tccounts.columns[-24:-8]]
designMEF2D2 = pd.DataFrame(index= [i.replace('-','.') for i in tccountsMEF2D.columns], 
                      columns=['DMSO','VHL'], 
                      data=np.array([[1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0],
                                     [0,0,0,0,1,1,1,1,0,0,0,0,0,0,0,0]],dtype=bool).T)
designMEF2D24 = pd.DataFrame(index=[i.replace('-','.') for i in tccountsMEF2D.columns], 
                      columns=['DMSO','VHL'], 
                      data=np.array([[0,0,0,0,0,0,0,0,1,1,1,1,0,0,0,0],
                                     [0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1]],dtype=bool).T)
In [573]:
### MYbi
tccountsMybi= tccounts[list(tccounts.columns[:15])+list(tccounts.columns[-8:-1])]
designMybi30 = pd.DataFrame(index= [i.replace('-','.') for i in tccountsMybi.columns], 
                      columns=['VHL','DMSO'], 
                      data=np.array([[1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],
                                     [0,0,0,0,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0]],dtype=bool).T)
designMybi6 = pd.DataFrame(index=[i.replace('-','.') for i in tccountsMybi.columns], 
                      columns=['VHL','DMSO'], 
                      data=np.array([[0,0,0,0,0,0,0,0,1,1,1,1,0,0,0,0,0,0,0,0,0,0],
                                     [0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,0,0,0,0,0,0,0]],dtype=bool).T)
designMybi24 = pd.DataFrame(index=[i.replace('-','.') for i in tccountsMybi.columns], 
                      columns=['DMSO','VHL'], 
                      data=np.array([[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,0,0,0],
                                     [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1]],dtype=bool).T)
In [580]:
### MYCi
tccountsMyci= tccounts[tccounts.columns[15:-24]]
designMS2 = pd.DataFrame(index=[i.replace('-','.') for i in tccountsMyci.columns], 
                      columns=['VHL','DMSO'], 
                      data=np.array([[1,1,1,0,0,0,0,0,0,0,0,0],
                                     [0,0,0,0,0,0,0,0,0,1,1,1]],dtype=bool).T)
designJQ1 = pd.DataFrame(index=[i.replace('-','.') for i in tccountsMyci.columns], 
                      columns=['VHL','DMSO'], 
                      data=np.array([[0,0,0,1,1,1,0,0,0,0,0,0],
                                     [0,0,0,0,0,0,0,0,0,1,1,1]],dtype=bool).T)
designMS2_JQ1 = pd.DataFrame(index=[i.replace('-','.') for i in tccountsMyci.columns], 
                      columns=['VHL','DMSO'], 
                      data=np.array([[0,0,0,0,0,0,1,1,1,0,0,0],
                                     [0,0,0,0,0,0,0,0,0,1,1,1]],dtype=bool).T)

Differential gene expression analysis, PCA and GO-term enrichment

For gene-level analysis, raw reads mapped to different UTR annotations of the same gene were summed up by Entrez Gene ID. Pilot studies of K562 cells with kinase inhibitors were performed as single experiments.

Analysis of differential gene expression was restricted to genes with ≥ 10 reads in at least one condition for 50bp sequencing runs (flavopiridol and DMSO) or ≥ 20 reads in at least one condition for 100bp sequencing runs (mk2206, trametinib, nilotinib, trametinib + mk2206 and DMSO). For estimating differential expression, a pseudo-count of 1 raw read was added to all genes.

All other SLAM-seq experiments were performed in triplicates and analyzed as follows.

Differential gene expression calling was performed on raw read counts with ≥ 2 T>C conversions using DESeq2 (version 1.14.1) with default settings, and with size factors estimated on corresponding total mRNA reads for global normalization.

Downstream analysis was restricted to genes passing all internal filters for FDR estimation by DESeq2. Principal component analysis was performed after variance stabilizing transformation on the 500 most variable genes across all conditions of a given experiment. GO-term enrichment analysis was performed on genes significantly and strongly downregulated (FDR ≤ 0.1, log2FC ≤ -1) in SLAM-seq upon IAA-treatment in K562MYC-AID + Tir1 by the PANTHER Overrepresentation Test (Fisher's Exact with FDR multiple test correction, release 20171205, http://pantherdb.org) on GO Ontology database Released 2017-12-27.

In [586]:
scaling="ERCCsamplewise"

MYCi

In [584]:
tccountsMyci= tccounts[list(tccountsMyci.columns)+['genes']]
MS2 = [1,1,1,0,0,0,0,0,0,1,1,1]
deseqMS2 = pyDESeq2.pyDESeq2(count_matrix=tccountsMyci[tccountsMyci.columns[np.array(MS2+[1],np.bool)]], design_matrix=designMS2[np.array(MS2,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
JQ1 = [0,0,0,1,1,1,0,0,0,1,1,1]
deseqJQ1 = pyDESeq2.pyDESeq2(count_matrix=tccountsMyci[tccountsMyci.columns[np.array(JQ1+[1],np.bool)]],
                         design_matrix=designJQ1[np.array(JQ1,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
MS2_JQ1 = [0,0,0,0,0,0,1,1,1,1,1,1]
deseqMS2_JQ1 = pyDESeq2.pyDESeq2(count_matrix=tccountsMyci[tccountsMyci.columns[np.array(MS2_JQ1+[1],np.bool)]],                     design_matrix=designMS2_JQ1[np.array(MS2_JQ1,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
3.3.2
3.3.2
3.3.2

Mybi

In [596]:
tccountsMybi= tccounts[list(tccountsMybi.columns)+['genes']]
Mybi30 = [1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0]
deseqMybi30 = pyDESeq2.pyDESeq2(count_matrix = tccountsMybi[tccountsMybi.columns[np.array(Mybi30+[1],np.bool)]],
                         design_matrix=designMybi30[np.array(Mybi30,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
Mybi6 = [0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,0,0,0,0,0,0,0]
deseqMybi6 = pyDESeq2.pyDESeq2(count_matrix = tccountsMybi[tccountsMybi.columns[np.array(Mybi6+[1],np.bool)]],
                         design_matrix=designMybi6[np.array(Mybi6,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
Mybi24 = [0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1]
deseqMybi24 = pyDESeq2.pyDESeq2(count_matrix=tccountsMybi[tccountsMybi.columns[np.array(Mybi24+[1],np.bool)]], design_matrix=designMybi24[np.array(Mybi24,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
3.3.2
3.3.2
3.3.2

MEF2D

In [597]:
MEF2D2 = [1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0]
tccountsMEF2D= tccounts[list(tccountsMEF2D.columns)+['genes']]
deseqMEF2D2 = pyDESeq2.pyDESeq2(count_matrix = tccountsMEF2D[tccountsMEF2D.columns[np.array(MEF2D2+[1],np.bool)]],
                         design_matrix=designMEF2D2[np.array(MEF2D2,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
MEF2D24 = [0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1]
deseqMEF2D24 = pyDESeq2.pyDESeq2(count_matrix = tccountsMEF2D[tccountsMEF2D.columns[np.array(MEF2D24+[1],np.bool)]],
                         design_matrix=designMEF2D24[np.array(MEF2D24,np.bool)],
                         design_formula="~DMSO - VHL",
                         gene_column="genes")
3.3.2
3.3.2

estimating size factors

MYCi

In [599]:
readcountsMyci.columns
Out[599]:
Index(['mr208.MV411.MS2.r1_tcount', 'mr209.MV411.MS2.r2_tcount',
       'mr210.MV411.MS2.r3_tcount', 'mr211.MV411.JQ1.r1_tcount',
       'mr212.MV411.JQ1.r2_tcount', 'mr213.MV411.JQ1.r3_tcount',
       'mr214.MV411.MS2_JQ1.r1_tcount', 'mr215.MV411.MS2_JQ1.r2_tcount',
       'mr216.MV411.MS2_JQ1.r3_tcount', 'mr217.MV411.DMSO.r1_tcount',
       'mr218.MV411.DMSO.r2_tcount', 'mr219.MV411.DMSO.r3_tcount'],
      dtype='object')
In [601]:
deseqMS2.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(
    readcounts[tccountsMyci.columns[np.array([1,1,1,0,0,0,0,0,0,0,0,0,0], np.bool)]].values+1), 1)))
deseqJQ1.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(
    readcounts[tccountsMyci.columns[np.array([0,0,0,1,1,1,0,0,0,0,0,0,0], np.bool)]].values+1), 1)))
deseqMS2_JQ1.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(
    readcounts[tccountsMyci.columns[np.array([0,0,0,0,0,0,1,1,1,0,0,0,0], np.bool)]].values+1), 1)))

MYBi

In [603]:
deseqMybi30.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(readcounts[tccountsMybi.columns[np.array([1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],np.bool)]].values+1),1)))
deseqMybi6.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(readcounts[tccountsMybi.columns[np.array([0,0,0,0,0,0,0,0,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0],np.bool)]].values+1),1)))
deseqMybi24.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(readcounts[tccountsMybi.columns[np.array([0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,0], np.bool)]].values+1), 1)))

MEF2D

In [604]:
deseqMEF2D2.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(readcounts[tccountsMEF2D.columns[
        np.array([0,0,0,0,1,1,1,1,0,0,0,0,0,0,0,0,0],np.bool)]].values+1),1)))
deseqMEF2D24.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(readcounts[tccountsMEF2D.columns[
        np.array([0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,0],np.bool)]].values+1),1)))

other size factor estimations

In [135]:
# from https://www.cell.com/trends/genetics/pdf/S0168-9525(13)00089-9.pdf FFROM THOUSANDS OF SAMPLES
housekeeping1 = ["C1orf43", "CHMP2A", "EMC7", "GPI", "PSMB2", "PSMB4", "RAB7A", "REEP5", "SNRPD3", "VCP", "VPS29"]

#https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4760967/ FOR CANCER CELL LINES
housekeeping2 = ['18S rRNA',
'ACTB',
'B2M',
'G6PD',
'GAPDH',
'GUSB',
'HMBS',
'HPRT1',
'PGK1',
'PPIA',
'RPL13a',
'SDHA',
'TBP',
'TUBB',
'YWHAZ']
In [136]:
housekeeping = readcounts.genes.isin(housekeeping2)
In [139]:
readcountsMybi= readcounts[readcounts.columns[16:-1]]
np.exp(np.mean(np.log(
    readcountsMybi[readcountsMybi.columns[np.array([1,1,1,1,0,0,0], np.bool)]].values+1), 1))
Out[139]:
array([  2.37841423,  65.42519431, 836.23056631, ...,   9.36138928,
        95.49529375,   1.        ])
In [231]:
readcountsMybi= readcounts[readcounts.columns[16:-1]]

deseqMybi.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(
    readcountsMybi[readcountsMybi.columns[np.array([1,1,1,1,0,0,0], np.bool)]].values+1), 1)), controlGenes=housekeeping)
In [232]:
readcountsMEF2D= readcounts[readcounts.columns[:16]]

deseqMEF2D2.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(readcountsMEF2D[readcountsMEF2D.columns[
        np.array([1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0],np.bool)]].values+1),1)), controlGenes=housekeeping)
deseqMEF2D24.run_estimate_size_factors(geoMeans = np.exp(np.mean(np.log(readcountsMEF2D[readcountsMEF2D.columns[
        np.array([0,0,0,0,0,0,0,0,1,1,1,1,0,0,0,0],np.bool)]].values+1),1)), controlGenes=housekeeping)

Modifying size factors

In [402]:
r
Out[402]:
{'MYBi_30m': [0.5543739168045854, 0.1654583646526328],
 'PBS_30m': [0.2600444176284328, 0.02279444794903803],
 'MYBi_6h': [0.5005330862395866, 0.04428975746477769],
 'PBS_6h': [0.23903615815004206, 0.060942601783761284],
 'MS2': [0.14512165615335024, 0.054750165018263075],
 'JQ1': [0.10594775516310602, 0.025098518494594674],
 'MS2_JQ1': [0.20200435554076682, 0.0493267432253527],
 'DMSO': [0.14632946312395476, 0.011039982545173618]}
In [ ]:
#### MYCi
In [605]:
sizeFact = deseqJQ1.getSizeFactors()
In [606]:
sizeFact
Out[606]:
array([1.27881861, 0.69317453, 0.97956167, 1.32270785, 0.98099653,
       0.88753456])
In [618]:
sizeFact[:3] = sizeFact[:3]* (res[[i for i in res.index if '-JQ1-' in i]].values/res[[i for i in res.index if '-DMSO-' in i]].values.mean())
In [619]:
sizeFact
Out[619]:
array([0.57990844, 0.56386995, 0.92732798, 1.32270785, 0.98099653,
       0.88753456])
In [620]:
deseqJQ1.setSizeFactors(sizeFact)
In [621]:
sizeFact = deseqMS2_JQ1.getSizeFactors()
In [361]:
sizeFact
Out[361]:
array([0.91890327, 0.75221206, 1.38316058, 1.27587544, 0.9512112 ,
       0.86185077])
In [633]:
sizeFact[:3] = sizeFact[:3]*(res[[i for i in res.index if '-MS2_JQ1-' in i]].values/res[[i for i in res.index if '-DMSO-' in i]].values.mean())
In [623]:
sizeFact
Out[623]:
array([0.84096739, 1.48151564, 1.86315441, 1.27587544, 0.9512112 ,
       0.86185077])
In [624]:
deseqMS2_JQ1.setSizeFactors(sizeFact)
In [338]:
#### MYBi
In [625]:
sizeFact = deseqMybi30.getSizeFactors()
In [629]:
sizeFact[:4] = sizeFact[:4]*(res[[i for i in res.index if '-MYBi_30m-' in i]].values/res[[i for i in res.index if '-PBS_30m-' in i]].values.mean())
In [630]:
deseqMybi30.setSizeFactors(sizeFact)
In [635]:
sizeFact = deseqMybi6.getSizeFactors()
In [636]:
sizeFact[:4] = sizeFact[:4]*(res[[i for i in res.index if '-MYBi_6h-' in i]].values/res[[i for i in res.index if '-PBS_6h-' in i]].values.mean())
In [637]:
deseqMybi6.setSizeFactors(sizeFact)
In [640]:
sizeFact = deseqMybi24.getSizeFactors()
In [641]:
sizeFact
Out[641]:
array([1.78063546, 0.62894913, 7.31501961, 0.68994994, 0.29654006,
       0.98521363, 0.60556756])
In [643]:
sizeFact[4:] = sizeFact[4:]*(res[[i for i in res.index if '-MYBi_24h-' in i]].values/res[[i for i in res.index if '-PBS_24h-' in i]].values.mean())
In [645]:
deseqMybi24.setSizeFactors(sizeFact)
In [ ]:
#### MEF2D
In [646]:
sizeFact = deseqMEF2D24.getSizeFactors()
In [647]:
sizeFact[4:] = sizeFact[4:]*(res[[i for i in res.index if '-VHL_24h-' in i]].values/res[[i for i in res.index if '-DMSO_24h-' in i]].values.mean())
In [648]:
deseqMEF2D24.setSizeFactors(sizeFact)

running it

In [653]:
deseqMybi24.run_deseq()
deseqMybi24.get_deseq_result()
resMybi24 = deseqMybi24.deseq_result
resMybi24.pvalue = np.nan_to_num(np.array(resMybi24.pvalue), 1)
resMybi24.log2FoldChange = np.nan_to_num(np.array(resMybi24.log2FoldChange), 0)
resMybi24.log2FoldChange = -resMybi24.log2FoldChange
resMybi24["gene_id"] = resMybi24.genes
R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

In [650]:
deseqMEF2D2.run_deseq()
deseqMEF2D24.run_deseq()
deseqMEF2D2.get_deseq_result()
deseqMEF2D24.get_deseq_result()
resMEF2D2 = deseqMEF2D2.deseq_result
resMEF2D24 = deseqMEF2D24.deseq_result
resMEF2D2.pvalue = np.nan_to_num(np.array(resMEF2D2.pvalue), 1)
resMEF2D2.log2FoldChange = np.nan_to_num(np.array(resMEF2D2.log2FoldChange), 0)
resMEF2D24.pvalue = np.nan_to_num(np.array(resMEF2D24.pvalue), 1)
resMEF2D24.log2FoldChange = np.nan_to_num(np.array(resMEF2D24.log2FoldChange), 0)
resMEF2D24.log2FoldChange = -resMEF2D24.log2FoldChange
resMEF2D2.log2FoldChange = -resMEF2D2.log2FoldChange
resMEF2D2["gene_id"] = resMEF2D2.genes
resMEF2D24["gene_id"] = resMEF2D24.genes
R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

In [651]:
deseqMS2.run_deseq()
deseqJQ1.run_deseq()
deseqMS2_JQ1.run_deseq()
deseqMS2.get_deseq_result()
deseqJQ1.get_deseq_result()
deseqMS2_JQ1.get_deseq_result()
resMS2 = deseqMS2.deseq_result
resJQ1 = deseqJQ1.deseq_result
resMS2_JQ1 = deseqMS2_JQ1.deseq_result
resMS2.pvalue = np.nan_to_num(np.array(resMS2.pvalue), 1)
resMS2.log2FoldChange = np.nan_to_num(np.array(resMS2.log2FoldChange), 0)
resJQ1.pvalue = np.nan_to_num(np.array(resJQ1.pvalue), 1)
resJQ1.log2FoldChange = np.nan_to_num(np.array(resJQ1.log2FoldChange), 0)
resMS2_JQ1.pvalue = np.nan_to_num(np.array(resMS2_JQ1.pvalue), 1)
resMS2_JQ1.log2FoldChange = np.nan_to_num(np.array(resMS2_JQ1.log2FoldChange), 0)
resMS2.log2FoldChange = -resMS2.log2FoldChange
resJQ1.log2FoldChange = -resJQ1.log2FoldChange
resMS2_JQ1.log2FoldChange = -resMS2_JQ1.log2FoldChange
resMS2["gene_id"] = resMS2.genes
resJQ1["gene_id"] = resJQ1.genes
resMS2_JQ1["gene_id"] = resMS2_JQ1.genes
R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: found already estimated dispersions, replacing these

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: found already estimated dispersions, replacing these

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: found already estimated dispersions, replacing these

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

In [652]:
deseqMybi30.run_deseq()
deseqMybi6.run_deseq()
deseqMybi30.get_deseq_result()
deseqMybi6.get_deseq_result()
resMybi30 = deseqMybi30.deseq_result
resMybi6 = deseqMybi6.deseq_result
resMybi30.pvalue = np.nan_to_num(np.array(resMybi30.pvalue), 1)
resMybi30.log2FoldChange = np.nan_to_num(np.array(resMybi30.log2FoldChange), 0)
resMybi6.pvalue = np.nan_to_num(np.array(resMybi6.pvalue), 1)
resMybi6.log2FoldChange = np.nan_to_num(np.array(resMybi6.log2FoldChange), 0)
resMybi6.log2FoldChange = -resMybi6.log2FoldChange
resMybi30.log2FoldChange = -resMybi30.log2FoldChange
resMybi30["gene_id"] = resMybi30.genes
resMybi6["gene_id"] = resMybi6.genes
R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

R[write to console]: using pre-existing size factors

R[write to console]: estimating dispersions

R[write to console]: gene-wise dispersion estimates

R[write to console]: mean-dispersion relationship

R[write to console]: final dispersion estimates

R[write to console]: fitting model and testing

PLOTS

whisker's plots

In [141]:
%matplotlib inline
In [373]:
res = resMybi30[resMybi30.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
/home/jeremie/.local/lib/python3.8/site-packages/pandas/core/generic.py:5303: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self[name] = value
<ipython-input-373-48ffebc3b001>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [374]:
ax = sns.boxplot(data=res,x='type',y='log2FoldChange').set_title("Mybi at 30mn foldChange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskersMybi_30mn_logfch.pdf")
In [375]:
ax =sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("Mybi 30mn baseMean")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_Mybi_30mn_baseMean.pdf")
In [376]:
res = resMybi6[resMybi6.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
/home/jeremie/.local/lib/python3.8/site-packages/pandas/core/generic.py:5303: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self[name] = value
<ipython-input-376-82478fb37811>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [377]:
ax= sns.boxplot(data=res,x='type',y='log2FoldChange')
ax.set_title("Mybi at 6h foldchange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_Mybi_6h_logfch.pdf")
In [378]:
ax = sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("Mybi at 6h baseMean")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_Mybi_6h_baseMean.pdf")
In [379]:
res = resMybi[resMybi.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
/home/jeremie/.local/lib/python3.8/site-packages/pandas/core/generic.py:5303: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self[name] = value
<ipython-input-379-9c3423f32532>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [288]:
ax= sns.boxplot(data=res,x='type',y='log2FoldChange')
ax.set_title("Mybi at 24h foldchange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_Mybi_24h_logfch.pdf")
In [289]:
ax = sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("Mybi at 24h baseMean")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_Mybi_24h_baseMean.pdf")

MEF2D

In [290]:
res = resMEF2D2[resMEF2D2.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
/home/jeremie/.local/lib/python3.8/site-packages/pandas/core/generic.py:5303: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self[name] = value
<ipython-input-290-7dea2ee8b938>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [291]:
ax= sns.boxplot(data=res,x='type',y='log2FoldChange')
ax.set_title("MEF2D at 2h foldchange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MEF2D_2h_logfch.pdf")
In [292]:
ax = sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("MEF2D at 2h baseMean")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MEF2D_2h_baseMean.pdf")
In [293]:
res = resMEF2D24[resMEF2D24.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
/home/jeremie/.local/lib/python3.8/site-packages/pandas/core/generic.py:5303: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self[name] = value
<ipython-input-293-bc2ba62415de>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [294]:
ax= sns.boxplot(data=res,x='type',y='log2FoldChange')
ax.set_title("MEF2D at 24h foldchange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MEF2D_24h_logfch.pdf")
In [295]:
ax = sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("MEF2D at 24h baseMean")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MEF2D_24h_baseMean.pdf")

Myci

In [380]:
res = resJQ1[resJQ1.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
<ipython-input-380-625ed54343ef>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [381]:
ax = sns.boxplot(data=res,x='type',y='log2FoldChange')
ax.set_title("JQ1 foldchange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_JQ1_logfch.pdf")
In [382]:
ax =sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("JQ1 base")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_JQ1_baseMean.pdf")
In [383]:
res = resMS2[resMS2.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
/home/jeremie/.local/lib/python3.8/site-packages/pandas/core/generic.py:5303: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self[name] = value
<ipython-input-383-e69356b5065c>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [384]:
ax =sns.boxplot(data=res,x='type',y='log2FoldChange')
ax.set_title("MS2 foldChange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MS2_logfch.pdf")
In [385]:
ax = sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("MS2 Base")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MS2_baseMean.pdf")
In [386]:
res = resMS2_JQ1[resMS2_JQ1.baseMean>10]
res.baseMean= np.log2(1+res.baseMean)
res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
/home/jeremie/.local/lib/python3.8/site-packages/pandas/core/generic.py:5303: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self[name] = value
<ipython-input-386-3a7f333fb32e>:3: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  res["type"] = ['ctf' if i else "other" for i in  res.genes.isin(ctf)]
In [387]:
ax = sns.boxplot(data=res,x='type',y='log2FoldChange')
ax.set_title("MS2+JQ1 foldChange")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MS2_JQ1_logfch.pdf")
In [388]:
ax = sns.boxplot(data=res,x='type',y='baseMean')
ax.set_title("MS2+JQ1 Base")
ax.figure.savefig('../results/'+project+"/plots/"+version+"_"+scaling+"_whiskers_MS2_JQ1_baseMean.pdf")

Scatter plot comparison

In [389]:
mix = pd.DataFrame()
mix["gene_id"] = resMybi30["gene_id"]
mix['Mybi 30mn'] = resMybi30.log2FoldChange
mix['Mybi 6h'] = resMybi6.log2FoldChange
In [390]:
scatter(mix[['Mybi 30mn','Mybi 6h']].values[:12000], 
               mix['gene_id'].values.tolist()[:12000], radi= 0.06, alpha=0.3,
              colors = [0 if i in ctf else 1 for i in mix['gene_id'].values.tolist()[:12000]],
       xname="Mybi 30mn",
    yname="Mybi 6h",
       folder='../results/'+project+"/plots/"+version+"_"+scaling+"_",
       title='Mybi 30mn vs 6h differences in logFoldChange')
Out[390]:
Figure(
id = '5724', …)

Regular volcanos

In [654]:
resMS2.to_csv("../results/"+project+"/"+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove)+'_MS2_deseq.csv')
resJQ1.to_csv("../results/"+project+"/"+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove)+'_JQ1_deseq.csv')
resMS2_JQ1.to_csv("../results/"+project+"/"+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove)+'_MS2_JQ1_deseq.csv')
In [655]:
resMybi30.to_csv("../results/"+project+"/"+version+'_'+scaling+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_Mybi_30um_deseq.csv')
resMybi6.to_csv("../results/"+project+"/"+version+'_'+scaling+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_Mybi_6h_deseq.csv')
In [658]:
resMybi24.to_csv("../results/"+project+"/"+version+'_'+scaling+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_Mybi_24h_deseq.csv')
In [657]:
resMEF2D2.to_csv("../results/"+project+"/"+version+'_'+scaling+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_MEF2D_2h_deseq.csv')
resMEF2D24.to_csv("../results/"+project+"/"+version+'_'+scaling+'_'+str(minvar_toremove)+'_'+str(mincount_toremove)+'_MEF2D_24h_deseq.csv')

we can conclude that we get similar results to the slamseq myc paper although it seems that our values are a bit skewed toward higher expression than what is on the slamseq paper. It mightt be explained by the pseudo count of 1 that I did not set. Because I think it would highly bias the DESeq algorithm.

In [659]:
show(volcano(resMS2,tohighlight=ctf, searchbox=True, title='DESeq results of MV411 under MS2 in volcano plot', folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove)))
show(volcano(resJQ1,tohighlight=ctf, searchbox=True, title='DESeq results of MV411 under JQ1 in volcano plot', folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove)))
show(volcano(resMS2_JQ1,tohighlight=ctf, searchbox=True, title='DESeq results of MV411 under MS2 and JQ1 in volcano plot', folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove)))

Mybi

In [660]:
show(volcano(resMybi30,tohighlight=ctf, searchbox=True, title="Mybi at 30mn", folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove)))
In [661]:
show(volcano(resMybi6,tohighlight=ctf, searchbox=True, title="Mybi at 6h", folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove),maxvalue=50))
In [662]:
show(volcano(resMybi24,tohighlight=ctf, searchbox=True, title="Mybi at 24h", folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove),maxvalue=50))

MEF2D

In [663]:
show(volcano(resMEF2D2,tohighlight=ctf, searchbox=True, title="MEF2D at 2h", folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove),maxvalue=50))
show(volcano(resMEF2D24,tohighlight=ctf, searchbox=True, title="MEF2D at 24h", folder='../results/'+project+'/plots/'+version+'_'+scaling+"_"+str(minvar_toremove)+'_'+str(mincount_toremove),maxvalue=50))

Readcounts version

In [664]:
%store res

%store tccounts
%store readcounts

%store tccountsMyci
%store tccountsMybi
%store tccountsMEF2D

%store designMS2
%store designJQ1
%store designMS2_JQ1

%store designMybi30
%store designMybi6
%store designMybi24

%store designMEF2D2
%store designMEF2D24

%store ctf

%store resMEF2D24
%store resMEF2D2
Stored 'res' (Series)
Stored 'tccounts' (DataFrame)
Stored 'readcounts' (DataFrame)
Stored 'tccountsMyci' (DataFrame)
Stored 'tccountsMybi' (DataFrame)
Stored 'tccountsMEF2D' (DataFrame)
Stored 'designMS2' (DataFrame)
Stored 'designJQ1' (DataFrame)
Stored 'designMS2_JQ1' (DataFrame)
Stored 'designMybi30' (DataFrame)
Stored 'designMybi6' (DataFrame)
Stored 'designMybi24' (DataFrame)
Stored 'designMEF2D2' (DataFrame)
Stored 'designMEF2D24' (DataFrame)
In [ ]: